npm - nexo-brain - Versions diffs - 7.31.13 → 7.33.0 - Mend

nexo-brain 7.31.13 → 7.33.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

package/.claude-plugin/plugin.json +1 -1
package/README.md +1 -1
package/package.json +1 -1
package/src/auto_close_sessions.py +38 -0
package/src/cognitive/_search.py +13 -2
package/src/consolidation_prep.py +380 -0
package/src/crons/sync.py +14 -7
package/src/db/__init__.py +3 -0
package/src/db/_memory_v2.py +276 -0
package/src/db/_schema.py +134 -0
package/src/hooks/auto_capture.py +60 -18
package/src/learning_resolver.py +42 -0
package/src/local_context/api.py +237 -33
package/src/local_context/db.py +3 -2
package/src/memory_retrieval.py +96 -7
package/src/plugins/protocol.py +71 -24
package/src/pre_answer_router.py +116 -6
package/src/scripts/nexo-followup-runner.py +110 -8
package/src/scripts/nexo-postmortem-consolidator.py +44 -1
package/src/tools_sessions.py +1 -1
package/templates/core-prompts/postmortem-consolidator.md +29 -2

package/.claude-plugin/plugin.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "nexo-brain",
-  "version": "7.31.13",
+  "version": "7.33.0",
   "description": "Local cognitive runtime for Claude Code \u2014 persistent memory, overnight learning, doctor diagnostics, personal scripts, recovery-aware jobs, startup preflight, and optional dashboard/power helper.",
   "author": {
     "name": "NEXO Brain",

package/README.md CHANGED Viewed

@@ -18,7 +18,7 @@
 [Watch the overview video](https://nexo-brain.com/watch/) · [Watch on YouTube](https://www.youtube.com/watch?v=i2lkGhKyVqI) · [Open the infographic](https://nexo-brain.com/assets/nexo-brain-infographic-v5.png)
-Version `7.31.13` is the current packaged-runtime line. Patch release over v7.31.12 - the offline wheel bundle no longer hard-pins onnxruntime, so cross-platform/offline installs (including older Linux) resolve a compatible native wheel instead of failing. Version `7.31.11` was a patch release over v7.31.10 - MCP lifecycle robustness + guardrail precision.
+Version `7.33.0` is the current packaged-runtime line. Minor release - Cognitive OS Ola 1 (phase 2): memory search now finds by MEANING (observation embeddings + FTS/vector fusion), the KG/causal graph is read at answer time (kg_neighbors pre-answer source), local files are recalled via FTS5, nightly learning consolidation no longer times out, correction capture is reliable (soft), and the followup runner uses an atomic lock. Builds on v7.32.0 (causal-graph populate + workflow reaper + the 7.31.14 critical fixes).
 Previously in `7.31.9`: patch release over v7.31.8 - UI release closeout now has to prove the original reported symptom was reopened with observable evidence before claiming the release is ready.

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "nexo-brain",
-  "version": "7.31.13",
+  "version": "7.33.0",
   "mcpName": "io.github.wazionapps/nexo",
   "description": "NEXO Brain — Shared brain for AI agents. Persistent memory, semantic RAG, natural forgetting, metacognitive guard, trust scoring, 150+ MCP tools. Works with Claude Code, Codex, Claude Desktop & any MCP client. 100% local, free.",
   "homepage": "https://nexo-brain.com",

package/src/auto_close_sessions.py CHANGED Viewed

@@ -182,6 +182,43 @@ def auto_close_open_protocol_tasks(conn, sid: str, task: str = "") -> list[str]:
     return closed
+def auto_close_abandoned_workflow_runs(conn, sid: str) -> dict:
+    """Reap durable workflow_runs / workflow_goals abandoned by a stale session.
+    auto_close only reaped protocol_tasks; a session that opened a durable
+    workflow_run / workflow_goal and never closed it left a zombie 'running'
+    row forever, polluting the resume surface (M10 gap). Move non-terminal ones
+    to a terminal state when their owning session is reaped. closed_at/updated_at
+    use datetime('now') to match the workflow tables' timestamp format.
+    Each table is handled by ONE set-based UPDATE filtered on session and
+    non-terminal status, so the reported counts are the rows actually changed
+    (cursor.rowcount) and no row factory with name access is required.
+    Args:
+        conn: Open DB connection whose execute() returns a DB-API cursor.
+        sid: Session id whose workflow rows should be reaped.
+    Returns:
+        {"runs": <workflow_runs cancelled>, "goals": <workflow_goals abandoned>}.
+        The function does not commit; that is left to the caller.
+    """
+    note = "auto-close: stale session ended without explicit workflow close"
+    runs_closed = conn.execute(
+        "UPDATE workflow_runs SET status='cancelled', next_action=?, "
+        "closed_at=datetime('now'), updated_at=datetime('now') "
+        "WHERE session_id = ? AND status IN ('open','running','blocked','waiting_approval')",
+        (note, sid),
+    ).rowcount
+    goals_closed = conn.execute(
+        "UPDATE workflow_goals SET status='abandoned', blocker_reason=?, "
+        "closed_at=datetime('now'), updated_at=datetime('now') "
+        "WHERE session_id = ? AND status IN ('active','blocked')",
+        (note, sid),
+    ).rowcount
+    return {"runs": runs_closed, "goals": goals_closed}
 def main():
     init_db()
     conn = get_db()
@@ -197,6 +234,7 @@ def main():
         draft = get_diary_draft(sid)
         closed_tasks = auto_close_open_protocol_tasks(conn, sid, task=session.get("task", ""))
         closed_task_ids.extend(closed_tasks)
+        auto_close_abandoned_workflow_runs(conn, sid)
         if draft:
             promote_draft_to_diary(sid, draft, task=session.get("task", ""))

package/src/cognitive/_search.py CHANGED Viewed

@@ -784,8 +784,19 @@ CO_ACTIVATION_MIN_STRENGTH = 0.1
 def _canonical_co_id(store: str, mid: int) -> int:
-    """Create a canonical hash ID for co-activation tracking."""
-    return hash(f"{store}:{mid}") % (2**31)
+    """Return a co-activation ID that is identical in every process.
+    The builtin hash() is salted per process (PYTHONHASHSEED), so a link
+    written by one MCP process never matched the same memory's id in the next
+    one. That fragmented the associative graph (observed ~6x distinct ids per
+    memory) and silently limited spreading activation to a single process
+    lifetime. A blake2b digest of "<store>:<mid>" is stable across processes
+    and runs; it is folded into the range [0, 2**31).
+    """
+    import hashlib
+    key = f"{store}:{mid}".encode("utf-8")
+    hasher = hashlib.blake2b(key, digest_size=8)
+    return int.from_bytes(hasher.digest(), "big") % (2**31)
 def record_co_activation(memory_ids: list[tuple[str, int]]):

package/src/consolidation_prep.py ADDED Viewed

@@ -0,0 +1,380 @@
+"""Read-only consolidation brief builder for the nightly postmortem.
+Why this module exists
+----------------------
+The nightly postmortem consolidator hands the LLM a tiny diary slice, but the
+prompt's "do not duplicate / detect contradiction" steps used to make the
+headless model pull the ENTIRE learnings corpus into its own context (via
+nexo_learning_list / nexo_learning_search / reading MEMORY.md). At hundreds of
+learnings the working context blows up and the timeout wrapper SIGKILLs the
+session (exit 124).
+The fix: precompute ALL corpus-wide MECHANICAL work here, in the consolidator
+SCRIPT process, and feed the LLM only a small, hard-capped JSON brief. The LLM
+keeps the SEMANTIC judgment it is uniquely good at (is this self-critique worth
+a permanent rule? which precomputed contradiction is real and how to phrase the
+canonical rule?) and loses every task that requires scanning the whole corpus.
+This module is READ-ONLY by construction: it performs SELECT-only queries on its
+own short-lived sqlite connection (mirrors apply_findings connection style) and
+NEVER commits, inserts, updates, or deletes. The only single source of truth for
+similarity / contradiction / dedup math remains learning_resolver — this module
+depends only on its PUBLIC surface.
+"""
+# The docstring must be the first statement to become the module __doc__; a
+# __future__ import is still legal directly after it.
+from __future__ import annotations
+import json
+import os
+import sqlite3
+from typing import Any
+import learning_resolver
+try:  # paths is available in the runtime; keep import defensive for odd installs
+    import paths as _paths
+except Exception:  # pragma: no cover - defensive
+    _paths = None
+# Read learnings in bounded batches so even a 5k-row corpus stays O(n) and the
+# helper itself never holds the whole textual corpus in a single prompt — it only
+# emits the capped brief below. This is the LIMIT page size used by
+# _iter_active_learnings.
+_CHUNK = 200
+# A learning is "weak" (stale candidate) when its weight is low, OR it lacks both
+# reasoning and prevention (no rationale to act on), OR it claims a file scope but
+# was never reinforced by a guard hit. Mirrors apply_findings weak-learning logic;
+# copied here as small local predicates rather than importing apply_findings (to
+# avoid that module's _DynamicPath side effects).
+# NOTE: _is_weak substitutes 0.5 for a NULL or unparseable weight, so with this
+# threshold such rows are always reported as low_weight.
+_WEAK_WEIGHT = 1.0
+def _resolve_db_path() -> str:
+    """Locate the SQLite database file, returning "" when nothing is configured.
+    The first non-blank value of NEXO_TEST_DB, then NEXO_DB, wins. Otherwise the
+    runtime ``paths`` module is asked, if it imported; any failure there yields "".
+    """
+    from_env = next(
+        (
+            candidate
+            for candidate in (
+                str(os.environ.get(name, "") or "").strip()
+                for name in ("NEXO_TEST_DB", "NEXO_DB")
+            )
+            if candidate
+        ),
+        "",
+    )
+    if from_env:
+        return from_env
+    if _paths is None:
+        return ""
+    try:
+        return str(_paths.resolve_db_path())
+    except Exception:
+        return ""
+def _open_conn() -> sqlite3.Connection | None:
+    """Open the resolved database with name-addressable rows, or return None.
+    None is returned when no path resolves, when the path is not an existing
+    file, or when connecting fails for any reason.
+    """
+    location = _resolve_db_path()
+    if not (location and os.path.isfile(location)):
+        return None
+    try:
+        handle = sqlite3.connect(location, timeout=30)
+        handle.row_factory = sqlite3.Row
+    except Exception:
+        return None
+    return handle
+def _table_columns(conn: sqlite3.Connection, table: str) -> set[str]:
+    """Return the column names of ``table``; an empty set on any failure.
+    A table that does not exist produces no PRAGMA rows and therefore also
+    yields an empty set.
+    """
+    names: set[str] = set()
+    try:
+        for entry in conn.execute(f"PRAGMA table_info({table})").fetchall():
+            # Index 1 of each table_info row is the column name.
+            names.add(str(entry[1]))
+    except Exception:
+        return set()
+    return names
+def _preview(text: str, limit: int = 160) -> str:
+    """Collapse whitespace runs and cut the result to at most ``limit`` characters.
+    A cut string keeps ``limit - 1`` characters, drops trailing whitespace and
+    ends with an ellipsis. Falsy input becomes "".
+    """
+    collapsed = " ".join(str(text or "").split())
+    if len(collapsed) <= limit:
+        return collapsed
+    return collapsed[: limit - 1].rstrip() + "…"
+def _slugify(text: str) -> str:
+    """Build a short dash-joined slug from ``text``; "topic" when nothing is left.
+    The text is normalised by learning_resolver, "/" is treated as a word
+    separator, at most 8 words are kept and the slug is cut to 80 characters.
+    """
+    words = learning_resolver._normalize_text(text).replace("/", " ").split()
+    slug = "-".join(words[:8])[:80]
+    return slug if slug else "topic"
+def _critique_text(diary: dict[str, Any]) -> str:
+    """Join a diary's ``self_critique`` and ``summary`` into one stripped string.
+    Missing or falsy fields are left out; the result is "" when both are absent.
+    """
+    pieces = []
+    for field in ("self_critique", "summary"):
+        value = str(diary.get(field) or "")
+        if value:
+            pieces.append(value)
+    return " ".join(pieces).strip()
+def _is_weak(row: dict[str, Any], columns: set[str]) -> str:
+    """Classify a learning row as weak, returning the reason ("" when not weak).
+    Checks run in this order and the first match wins:
+    1. ``low_weight (<w>)`` - only when a ``weight`` column exists and the value
+       is below _WEAK_WEIGHT. A NULL or unparseable weight counts as 0.5.
+    2. ``no_reasoning_or_prevention`` - both fields blank.
+    3. ``scoped_never_guard_hit`` - only when both ``applies_to`` and
+       ``guard_hits`` columns exist, the row has a scope, and its guard hit
+       count is 0 (an unparseable count is treated as 0).
+    """
+    if "weight" in columns:
+        raw_weight = row.get("weight")
+        try:
+            score = 0.5 if raw_weight is None else float(raw_weight)
+        except Exception:
+            score = 0.5
+        if score < _WEAK_WEIGHT:
+            return f"low_weight ({round(score, 2)})"
+    has_reasoning = bool(str(row.get("reasoning") or "").strip())
+    has_prevention = bool(str(row.get("prevention") or "").strip())
+    if not (has_reasoning or has_prevention):
+        return "no_reasoning_or_prevention"
+    if "applies_to" not in columns or "guard_hits" not in columns:
+        return ""
+    scope = str(row.get("applies_to") or "").strip()
+    try:
+        hits = int(row.get("guard_hits") or 0)
+    except Exception:
+        hits = 0
+    return "scoped_never_guard_hit" if scope and hits == 0 else ""
+def _iter_active_learnings(conn: sqlite3.Connection, columns: set[str]):
+    """Yield active learnings as dicts, fetched one _CHUNK-sized page at a time.
+    Rows are filtered to status 'active' (NULL counts as active) only when a
+    ``status`` column exists, and ordered newest-first by ``updated_at`` when
+    that column exists, otherwise by ``id``. Any query error ends the iteration
+    silently.
+    """
+    where = " WHERE COALESCE(status, 'active') = 'active'" if "status" in columns else ""
+    ordering = "updated_at DESC, id DESC" if "updated_at" in columns else "id DESC"
+    start = 0
+    while True:
+        try:
+            batch = conn.execute(
+                f"SELECT * FROM learnings{where} ORDER BY {ordering} LIMIT ? OFFSET ?",
+                (_CHUNK, start),
+            ).fetchall()
+        except Exception:
+            return
+        if not batch:
+            return
+        yield from (dict(item) for item in batch)
+        # A short page means the table is exhausted; skip the extra round trip.
+        if len(batch) < _CHUNK:
+            return
+        start += _CHUNK
+def build_consolidation_brief(
+    diaries_with_critique: list[dict],
+    *,
+    conn: sqlite3.Connection | None = None,
+    max_chars: int = 6000,
+    max_shortlist: int = 25,
+    max_contradictions: int = 15,
+    max_stale: int = 15,
+) -> dict:
+    """Build a small, hard-capped JSON brief from today's critiques + the corpus.
+    READ-ONLY: opens its own short-lived connection (unless one is supplied),
+    performs only read queries, and never commits. The brief is the ONLY thing
+    handed to the LLM, so the model never lists the whole corpus.
+    Args:
+        diaries_with_critique: Diary dicts; ``self_critique``, ``summary`` and
+            ``domain`` are the keys read. Entries without critique/summary text
+            are skipped. ``None`` is treated as an empty list.
+        conn: Optional open connection. When omitted, one is opened via
+            ``_open_conn`` and closed before returning; a supplied connection
+            is left open.
+        max_chars: Budget for ``len(json.dumps(brief, ensure_ascii=False))``.
+            Only the list sections below are trimmed, so a brief whose
+            ``today_topics`` alone exceed the budget can still be over it.
+        max_shortlist: Cap on ``shortlist`` entries.
+        max_contradictions: Cap on ``contradiction_pairs`` entries.
+        max_stale: Cap on ``stale_candidates`` entries and on the number of
+            ``preference_key_dupes`` groups.
+    Returns:
+        Dict with keys ``corpus_size``, ``today_topics``, ``shortlist``,
+        ``contradiction_pairs``, ``supersession_stubs``, ``stale_candidates``,
+        ``preference_key_dupes`` and ``truncated`` (True when trimming ran).
+    """
+    own_conn = conn is None
+    if own_conn:
+        conn = _open_conn()
+    brief: dict[str, Any] = {
+        "corpus_size": 0,
+        "today_topics": [],
+        "shortlist": [],
+        "contradiction_pairs": [],
+        "supersession_stubs": [],
+        "stale_candidates": [],
+        "preference_key_dupes": [],
+        "truncated": False,
+    }
+    # Build today's topics regardless of corpus availability. Keys starting with
+    # "_" are private working data and never reach the brief.
+    today_topics: list[dict[str, Any]] = []
+    for diary in diaries_with_critique or []:
+        text = _critique_text(diary)
+        if not text:
+            continue
+        title = _preview(diary.get("summary") or diary.get("self_critique") or "", 120)
+        today_topics.append(
+            {
+                "slug": _slugify(diary.get("summary") or diary.get("self_critique") or ""),
+                "title": title,
+                "_text": text,
+                "_tokens": set(learning_resolver._tokenize(text)),
+                "_applies": str(diary.get("domain") or ""),
+                "has_existing_coverage": False,
+                "covering_ids": [],
+            }
+        )
+    def _public_topics() -> list[dict[str, Any]]:
+        # Single place that projects topics down to the fields the LLM may see.
+        return [
+            {
+                "slug": t["slug"],
+                "title": t["title"],
+                "has_existing_coverage": bool(t["has_existing_coverage"]),
+                "covering_ids": list(t["covering_ids"]),
+            }
+            for t in today_topics
+        ]
+    if conn is None:
+        # No corpus available (fresh install / missing DB). Emit topics only.
+        brief["today_topics"] = _public_topics()
+        return brief
+    try:
+        columns = _table_columns(conn, "learnings")
+        if not columns:
+            # No learnings table (or it is unreadable): topics only.
+            brief["today_topics"] = _public_topics()
+            return brief
+        corpus_size = 0
+        shortlist: list[dict[str, Any]] = []
+        contradiction_pairs: list[dict[str, Any]] = []
+        stale_candidates: list[dict[str, Any]] = []
+        key_buckets: dict[str, list[int]] = {}
+        seen_shortlist_ids: set[int] = set()
+        # Titles of every row recorded as covering a topic. Kept separately from
+        # the shortlist because the shortlist is capped, and a covering row that
+        # missed the cap would otherwise get an empty title in its stub.
+        covering_titles: dict[int, str] = {}
+        for row in _iter_active_learnings(conn, columns):
+            corpus_size += 1
+            row_id = int(row.get("id") or 0)
+            row_title = str(row.get("title") or "")
+            row_content = str(row.get("content") or "")
+            row_applies = str(row.get("applies_to") or "")
+            row_text = f"{row_title} {row_content}".strip()
+            # (5) preference-key dedup — collapse colliding normalized keys.
+            key = learning_resolver.normalized_key(row_title, row_applies)
+            if key:
+                key_buckets.setdefault(key, []).append(row_id)
+            # (4) stale shortlist — weak/low-weight/never-guard-hit actives.
+            if len(stale_candidates) < max_stale:
+                weakness = _is_weak(row, columns)
+                if weakness:
+                    stale_candidates.append(
+                        {"id": row_id, "title": _preview(row_title, 120), "weakness": weakness}
+                    )
+            # Relevance vs today's topics drives shortlist + coverage + contradiction.
+            # The row's token set does not depend on the topic, so build it once
+            # per row (and not at all when there are no topics).
+            row_tokens = set(learning_resolver._tokenize(row_text)) if today_topics else set()
+            relevant_to: list[dict[str, Any]] = []
+            for topic in today_topics:
+                related = bool(topic["_tokens"] & row_tokens)
+                scoped = bool(
+                    topic["_applies"]
+                    and row_applies
+                    and learning_resolver.applies_overlap(row_applies, topic["_applies"])
+                )
+                if not (related or scoped):
+                    continue
+                sim = learning_resolver.candidate_similarity(topic["_text"], row_text)
+                if sim >= 0.55 or scoped:
+                    relevant_to.append(topic)
+                    if row_id:
+                        topic["has_existing_coverage"] = True
+                        # Cap example covering ids so a topic covered by hundreds of
+                        # rules cannot balloon the brief; the boolean flag is what
+                        # the LLM acts on.
+                        if row_id not in topic["covering_ids"] and len(topic["covering_ids"]) < 10:
+                            topic["covering_ids"].append(row_id)
+                            covering_titles[row_id] = _preview(row_title, 120)
+                # (6) contradiction pairs vs today-topics.
+                if len(contradiction_pairs) < max_contradictions and learning_resolver.looks_contradictory(
+                    row_text, topic["_text"]
+                ):
+                    contradiction_pairs.append(
+                        {
+                            "existing_id": row_id,
+                            "existing_title": _preview(row_title, 120),
+                            "with": "today_topic",
+                            "snippet_a": _preview(row_text, 160),
+                            "snippet_b": _preview(topic["_text"], 160),
+                            "similarity": round(float(sim), 4),
+                        }
+                    )
+            if relevant_to and len(shortlist) < max_shortlist and row_id not in seen_shortlist_ids:
+                seen_shortlist_ids.add(row_id)
+                shortlist.append(
+                    {
+                        "id": row_id,
+                        "title": _preview(row_title, 120),
+                        "category": str(row.get("category") or ""),
+                        "applies_to": row_applies,
+                        "content_preview": _preview(row_content, 160),
+                    }
+                )
+        # (5) preference-key dupes — only keys with 2+ colliding ids. Cap both the
+        # number of dupe groups and the ids listed per group so a pathological
+        # corpus (hundreds of identical-title rules) cannot balloon the brief.
+        preference_key_dupes = []
+        for key, ids in key_buckets.items():
+            if len(ids) <= 1:
+                continue
+            preference_key_dupes.append({"key": key, "ids": ids[:10], "total": len(ids)})
+            if len(preference_key_dupes) >= max_stale:
+                break
+        # (3) supersession stubs — today-topics that already have higher-authority
+        # coverage are candidates to be replaced by a canonical rule. Only the
+        # first covering id of each topic gets a stub.
+        supersession_stubs: list[dict[str, Any]] = []
+        for topic in today_topics:
+            for old_id in topic["covering_ids"][:1]:
+                supersession_stubs.append(
+                    {
+                        "old_id": old_id,
+                        "old_title": covering_titles.get(old_id, ""),
+                        "reason": f"today topic '{topic['slug']}' may replace existing rule #{old_id}",
+                    }
+                )
+        brief["corpus_size"] = corpus_size
+        brief["today_topics"] = _public_topics()
+        brief["shortlist"] = shortlist
+        brief["contradiction_pairs"] = contradiction_pairs
+        brief["supersession_stubs"] = supersession_stubs
+        brief["stale_candidates"] = stale_candidates
+        brief["preference_key_dupes"] = preference_key_dupes
+    finally:
+        if own_conn:
+            try:
+                conn.close()
+            except Exception:
+                pass
+    # Enforce max_chars: drop lowest-priority items until the serialized brief is
+    # under budget. Preference-key dupes go first, then supersession stubs, then
+    # stale candidates; after that contradiction pairs and the shortlist are cut
+    # from the tail, each down to one entry before either is emptied.
+    def _size() -> int:
+        return len(json.dumps(brief, ensure_ascii=False))
+    if _size() > max_chars:
+        brief["truncated"] = True
+        trim_order = ("preference_key_dupes", "supersession_stubs", "stale_candidates")
+        for field in trim_order:
+            while brief[field] and _size() > max_chars:
+                brief[field].pop()
+        while len(brief["contradiction_pairs"]) > 1 and _size() > max_chars:
+            brief["contradiction_pairs"].pop()
+        while len(brief["shortlist"]) > 1 and _size() > max_chars:
+            brief["shortlist"].pop()
+        # Last resort: trim contradiction/shortlist to empty-ish.
+        while brief["contradiction_pairs"] and _size() > max_chars:
+            brief["contradiction_pairs"].pop()
+        while brief["shortlist"] and _size() > max_chars:
+            brief["shortlist"].pop()
+    return brief
+__all__ = ["build_consolidation_brief"]

package/src/crons/sync.py CHANGED Viewed

@@ -727,13 +727,18 @@ def install_plist(label: str, plist: dict, plist_path: Path, dry_run: bool):
         log(f"  DRY-RUN: would install {plist_path.name}")
         return
-    with open(plist_path, "wb") as f:
-        plistlib.dump(plist, f)
+    # Ephemeral/test runtimes (temp NEXO_HOME or HOME, e.g. a pytest run) must
+    # NOT touch the operator's real ~/Library/LaunchAgents. The guard is checked
+    # BEFORE writing the plist file: otherwise a test run rewrites the real
+    # plists with temp-dir ProgramArguments, and one reboot/reload silently
+    # kills the whole consolidation cron fleet (cron-fleet-drift incident).
     if not launchctl_side_effects_allowed():
-        log(f"  Installed but skipped launchctl in ephemeral runtime: {plist_path.name}")
+        log(f"  Skipped plist write in ephemeral runtime: {plist_path.name}")
         return
+    with open(plist_path, "wb") as f:
+        plistlib.dump(plist, f)
     result = reload_launchagent_plist(plist_path, label=label)
     if result.get("action") == "skipped-ephemeral-runtime":
         log(f"  Installed but skipped launchctl in ephemeral runtime: {plist_path.name}")
@@ -751,8 +756,8 @@ def unload_plist(plist_path: Path, dry_run: bool):
         return
     if not launchctl_side_effects_allowed():
-        plist_path.unlink(missing_ok=True)
-        log(f"  Removed without launchctl in ephemeral runtime: {plist_path.name}")
+        # Ephemeral/test runtime: never delete the operator's real plists.
+        log(f"  Skipped plist removal in ephemeral runtime: {plist_path.name}")
         return
     result = unload_launchagent_plist(plist_path)
@@ -830,7 +835,9 @@ def sync(dry_run: bool = False):
         return
     LOG_DIR.mkdir(parents=True, exist_ok=True)
-    LAUNCH_AGENTS_DIR.mkdir(parents=True, exist_ok=True)
+    # In an ephemeral/test runtime, do not even create the real LaunchAgents dir.
+    if launchctl_side_effects_allowed():
+        LAUNCH_AGENTS_DIR.mkdir(parents=True, exist_ok=True)
     manifest_crons = load_manifest()
     manifest_ids = {c["id"] for c in manifest_crons}

package/src/db/__init__.py CHANGED Viewed

@@ -106,6 +106,9 @@ from db._memory_v2 import (
     list_memory_observations,
     search_memory_observations_fts,
     backfill_memory_observations,
+    backfill_observation_embeddings,
+    vector_scan_observations,
+    get_memory_observations_by_uids,
     memory_observation_health,
     maintain_memory_observations,
     memory_observation_stats,