npm - nexo-brain - Versions diffs - 0.2.1 → 0.3.2 - Mend

nexo-brain 0.2.1 → 0.3.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

package/README.md +158 -72
package/bin/nexo-brain 2.js +610 -0
package/package.json +2 -2
package/scripts/pre-commit-check 2.sh +55 -0
package/src/cognitive.py +1582 -56
package/src/db.py +49 -25
package/src/hooks/auto_capture.py +208 -0
package/src/plugins/cognitive_memory.py +276 -17
package/src/scripts/nexo-catchup.py +32 -15
package/src/scripts/nexo-cognitive-decay.py +2 -4
package/src/scripts/nexo-daily-self-audit.py +148 -29
package/src/scripts/nexo-immune.py +869 -0
package/src/scripts/nexo-postmortem-consolidator.py +42 -40
package/src/scripts/nexo-sleep.py +90 -39
package/src/scripts/nexo-synthesis.py +78 -76
package/src/tools_sessions.py +2 -2
package/templates/CLAUDE.md 2.template +89 -0
package/templates/CLAUDE.md.template +1 -1

package/src/db.py CHANGED

@@ -7,20 +7,16 @@ import secrets
 import string
 import datetime
 import pathlib
-from pathlib import Path
-NEXO_HOME = Path(os.environ.get("NEXO_HOME", str(Path.home() / ".nexo")))
-NEXO_HOME.mkdir(parents=True, exist_ok=True)
 DB_PATH = os.environ.get(
     "NEXO_TEST_DB",
     os.environ.get(
         "NEXO_DB",
-        str(NEXO_HOME / "nexo.db"),
+        os.path.join(os.path.dirname(os.path.abspath(__file__)), "nexo.db"),
     ),
 )
-# TTLs in seconds
+# TTLs in seconds (match session-coord.sh behavior)
 SESSION_STALE_SECONDS = 900    # 15 min (documented TTL)
 MESSAGE_TTL_SECONDS = 3600     # 1 hour
 QUESTION_TTL_SECONDS = 600     # 10 min
@@ -369,23 +365,25 @@ def init_db():
 # ── FTS5 Unified Search ──────────────────────────────────────────
-# Directories to index for unified search (uses NEXO_HOME)
+# Directories to index for unified search
 _FTS_MD_DIRS = [
-    str(NEXO_HOME / "docs"),
-    str(NEXO_HOME / "projects"),
-    str(NEXO_HOME / "memory"),
-    str(NEXO_HOME / "operations"),
-    str(NEXO_HOME / "learnings"),
-    str(NEXO_HOME / "brain"),
-    str(NEXO_HOME / "agents"),
-    str(NEXO_HOME / "skills"),
+    os.path.expanduser("~/claude/docs"),
+    os.path.expanduser("~/claude/projects"),
+    os.path.expanduser("~/claude/memory"),
+    os.path.expanduser("~/claude/operations"),
+    os.path.expanduser("~/claude/learnings"),
+    os.path.expanduser("~/claude/brain"),
+    os.path.expanduser("~/claude/agents"),
+    os.path.expanduser("~/claude/skills"),
+]
+# Code repos: index source files (skip vendor, node_modules, etc.)
+_FTS_CODE_DIRS = [
+    (os.path.expanduser("~/Documents/_PhpstormProjects"), ["*.php", "*.js", "*.json", "*.py", "*.ts", "*.tsx"]),
 ]
-# Code repos: populated via nexo_index_add_dir tool or NEXO_HOME/repos
-_FTS_CODE_DIRS = []
 _FTS_CODE_SKIP = {
     "vendor", "node_modules", ".git", "cache", "tmp", "logs", "uploads",
     "assets/img", "assets/fonts", ".next", "dist", "build", ".prisma",
-    "public/build", ".turbo", "__pycache__",
+    "PROYECTOS ANTIGUOS", "public/build", ".turbo", "__pycache__",
     "coverage", ".nyc_output", "storage/framework", "bootstrap/cache",
 }
 _FTS_MAX_FILE_SIZE = 50_000  # skip .md files >50KB
@@ -1194,7 +1192,13 @@ def update_followup(id: str, **kwargs) -> dict:
 def _calc_next_recurrence_date(recurrence: str, current_date: str = None) -> str:
-    """Calculate the next date for a recurring followup."""
+    """Calculate the next date for a recurring followup.
+    Formats:
+        weekly:monday, weekly:thursday, weekly:friday, weekly:sunday
+        monthly:1, monthly:10, monthly:15
+        quarterly
+    """
     today = datetime.date.today()
     base = datetime.date.fromisoformat(current_date) if current_date else today
@@ -1205,11 +1209,12 @@ def _calc_next_recurrence_date(recurrence: str, current_date: str = None) -> str
         target_day = day_map.get(day_name, 0)
         days_ahead = (target_day - today.weekday()) % 7
         if days_ahead == 0:
-            days_ahead = 7
+            days_ahead = 7  # next week, not today
         return (today + datetime.timedelta(days=days_ahead)).isoformat()
     elif recurrence.startswith('monthly:'):
         target_day = int(recurrence.split(':')[1])
+        # Next month from today
         if today.month == 12:
             next_date = datetime.date(today.year + 1, 1, min(target_day, 28))
         else:
@@ -1219,6 +1224,7 @@ def _calc_next_recurrence_date(recurrence: str, current_date: str = None) -> str
         return next_date.isoformat()
     elif recurrence == 'quarterly':
+        # 3 months from current date
         month = base.month + 3
         year = base.year
         if month > 12:
@@ -1252,6 +1258,7 @@ def complete_followup(id: str, result: str = '') -> dict:
     if recurrence:
         next_date = _calc_next_recurrence_date(recurrence, row["date"])
         if next_date:
+            # Rename completed one to include date suffix, then create fresh one
             archived_id = f"{id}-{today}"
             conn.execute("UPDATE followups SET id = ? WHERE id = ?", (archived_id, id))
             conn.commit()
@@ -1829,6 +1836,7 @@ def delete_agent(id: str) -> bool:
 def cleanup_old_changes(retention_days: int = 90) -> int:
     """Delete change_log entries older than retention_days. Returns count deleted."""
     conn = get_db()
+    # Get IDs before deleting so we can clean FTS
     ids = [str(r[0]) for r in conn.execute(
         "SELECT id FROM change_log WHERE created_at < datetime('now', ?)",
         (f"-{retention_days} days",)
@@ -2085,7 +2093,7 @@ def read_session_diary(session_id: str = '', last_n: int = 3, last_day: bool = F
     - session_id: returns entries for that specific session
     - last_day: returns ALL entries from the most recent day (multi-terminal aware)
     - last_n: returns last N entries (default)
-    - domain: filter by project context (e.g., infrastructure, nexo, server, other)
+    - domain: filter by project context (e.g. project-a, project-b, nexo, server, other)
     """
     conn = get_db()
     domain_clause = " AND domain = ?" if domain else ""
@@ -2097,6 +2105,7 @@ def read_session_diary(session_id: str = '', last_n: int = 3, last_day: bool = F
             (session_id,) + domain_params
         ).fetchall()
     elif last_day:
+        # Get all entries from the most recent calendar day
         if domain:
             latest = conn.execute(
                 "SELECT date(created_at) as day FROM session_diary WHERE domain = ? ORDER BY created_at DESC LIMIT 1",
@@ -2121,7 +2130,13 @@ def read_session_diary(session_id: str = '', last_n: int = 3, last_day: bool = F
 def _multi_word_like(query: str, columns: list[str]) -> tuple[str, list]:
-    """Build AND-ed LIKE conditions: every word must appear in at least one of the columns."""
+    """Build AND-ed LIKE conditions: every word must appear in at least one of the columns.
+    Returns (sql_fragment, params) ready for WHERE clause.
+    Example: query="cron learn", columns=["title","content"]
+    → "(title LIKE ? OR content LIKE ?) AND (title LIKE ? OR content LIKE ?)"
+    with params ["%cron%","%cron%","%learn%","%learn%"]
+    """
     words = query.strip().split()
     if not words:
         return "1=1", []
@@ -2136,8 +2151,13 @@ def _multi_word_like(query: str, columns: list[str]) -> tuple[str, list]:
 def recall(query: str, days: int = 30) -> list[dict]:
-    """Cross-search ALL memory using FTS5: learnings, decisions, changes, diary, followups, entities, .md files."""
-    results = fts_search(query, limit=40)
+    """Cross-search ALL memory using FTS5: learnings, decisions, changes, diary, followups, entities, .md files.
+    Returns up to 20 results ranked by relevance (FTS5 bm25).
+    Falls back to LIKE-based search if FTS fails.
+    """
+    # Try FTS5 first (fast, ranked), then filter by days
+    results = fts_search(query, limit=40)  # fetch extra to allow filtering
     if results:
         cutoff_epoch = now_epoch() - (days * 86400)
         filtered = []
@@ -2146,9 +2166,12 @@ def recall(query: str, days: int = 30) -> list[dict]:
             if not ua:
                 filtered.append(r)
                 continue
+            # Normalize to epoch for comparison
             try:
                 if ua[0].isdigit() and ('.' in ua or len(ua) > 12):
+                    # Could be epoch float or ISO date
                     if '-' in ua[:5]:
+                        # ISO datetime like "2026-03-13 16:17:40"
                         dt = datetime.datetime.fromisoformat(ua.replace(' ', 'T'))
                         ts = dt.timestamp()
                     else:
@@ -2158,10 +2181,11 @@ def recall(query: str, days: int = 30) -> list[dict]:
                 if ts >= cutoff_epoch:
                     filtered.append(r)
             except (ValueError, TypeError):
-                filtered.append(r)
+                filtered.append(r)  # keep if can't parse
         if filtered:
             return filtered[:20]
+    # Fallback to old LIKE-based search
     days = max(1, int(days))
     conn = get_db()
     cutoff_dt = datetime.datetime.now() - datetime.timedelta(days=days)

package/src/hooks/auto_capture.py ADDED

@@ -0,0 +1,208 @@
+#!/usr/bin/env python3
+"""NEXO Auto-Capture Hook — Extract facts from conversation context.
+Inspired by claude-mem's observation handler and transcript processor.
+Uses simple heuristics (no LLM) to extract decisions, corrections,
+and explicit facts from conversation messages.
+Can be called:
+- Programmatically via process_conversation()
+- From Claude Code hooks via stdin (pipe conversation lines)
+- As CLI: python3 auto_capture.py "message1" "message2" ...
+Stores extracted facts via cognitive.ingest() with appropriate tags.
+"""
+import re
+import sys
+from pathlib import Path
+# Add the parent of hooks/ (the package's src directory) to sys.path so "import cognitive" resolves
+sys.path.insert(0, str(Path(__file__).resolve().parent.parent))
+import cognitive
+# ---------------------------------------------------------------------------
+# Pattern definitions (adapted from claude-mem's transcript processor
+# and ShieldCortex's pattern groups approach)
+#
+# Every pattern is compiled once at import time with re.IGNORECASE and is
+# applied with .search() by _classify_line(), so a phrase may appear anywhere
+# in a line. Within one list, _classify_line() stops at the first pattern that
+# matches, so the order of patterns inside a list does not affect the result.
+# ---------------------------------------------------------------------------
+# Decision patterns — lines indicating a choice was made
+_DECISION_PATTERNS = [
+    re.compile(r'\b(?:decided|agreed|will do|changed to|switching to|going with|chose|chosen|opted for)\b', re.IGNORECASE),
+    re.compile(r'\b(?:let\'?s go with|the plan is|we\'?ll use|moving forward with)\b', re.IGNORECASE),
+    re.compile(r'\b(?:approved|confirmed|locked in|finalized)\b', re.IGNORECASE),
+    re.compile(r'\b(?:decidido|acordado|vamos con|cambiamos a|elegimos)\b', re.IGNORECASE),  # Spanish
+]
+# Correction patterns — lines indicating something was wrong
+# NOTE(review): several alternatives ("actually", "error", "stop", "mal") are
+# common in ordinary text, so this group will likely over-match — confirm that
+# the downstream ingest gate is expected to absorb those false positives.
+# NOTE(review): because of the trailing \b, the `no,\s` alternative only
+# matches when the whitespace character is immediately followed by a word
+# character (e.g. "no, that" matches; "no,  that" with two spaces does not).
+_CORRECTION_PATTERNS = [
+    re.compile(r'\b(?:don\'?t|stop|wrong|incorrect|that\'?s not right|fix this)\b', re.IGNORECASE),
+    re.compile(r'\b(?:should be|actually|not that|the correct|mistake|error)\b', re.IGNORECASE),
+    re.compile(r'\b(?:never do that|wrong approach|that broke|revert)\b', re.IGNORECASE),
+    re.compile(r'\b(?:no,\s|nope|mal|otra vez|ya te dije|no es|est[aá] mal)\b', re.IGNORECASE),  # Spanish
+]
+# Explicit fact patterns — user explicitly asks to remember something.
+# Colon-terminated markers ("important:", "rule:", "importante:", "regla:")
+# live in their own patterns WITHOUT a trailing \b: after ":" a \b only
+# matches when the next character is a word character, so the usual form
+# "Important: use WAL" (colon followed by a space) would never match.
+# Everything the previous patterns matched is still matched.
+_EXPLICIT_PATTERNS = [
+    re.compile(r'\b(?:remember|note that|keep in mind|don\'?t forget)\b', re.IGNORECASE),
+    re.compile(r'\b(?:for future reference|take note|key point)\b', re.IGNORECASE),
+    re.compile(r'\b(?:important|rule):', re.IGNORECASE),
+    re.compile(r'\b(?:recuerda|ten en cuenta|no olvides)\b', re.IGNORECASE),  # Spanish
+    re.compile(r'\b(?:importante|regla):', re.IGNORECASE),  # Spanish
+]
+# Minimum stripped line length to consider (shorter lines are skipped)
+_MIN_LINE_LENGTH = 15
+# Maximum number of characters kept from a fact's content
+_MAX_FACT_LENGTH = 500
+def _classify_line(line: str) -> list[tuple[str, str]]:
+    """Tag one conversation line with every fact category it matches.
+    The line is stripped first; anything shorter than _MIN_LINE_LENGTH
+    characters is ignored. Categories are checked in the fixed order
+    decision, correction, explicit, and each category contributes at most
+    one entry no matter how many of its patterns match.
+    Returns a list of (fact_type, content) tuples where content is the
+    stripped line; the list is empty when nothing matches.
+    """
+    text = line.strip()
+    if len(text) < _MIN_LINE_LENGTH:
+        return []
+    categories = (
+        ("decision", _DECISION_PATTERNS),
+        ("correction", _CORRECTION_PATTERNS),
+        ("explicit", _EXPLICIT_PATTERNS),
+    )
+    return [
+        (label, text)
+        for label, patterns in categories
+        if any(rx.search(text) for rx in patterns)
+    ]
+def process_conversation(messages: list[str]) -> dict:
+    """Extract decisions, corrections and explicit facts from messages and store them.
+    Each message is split on newlines and every line is classified with
+    _classify_line(). Facts are truncated to _MAX_FACT_LENGTH characters,
+    de-duplicated per (fact type, case-insensitive content) and passed to
+    cognitive.ingest() with source_type='auto_capture'.
+    Args:
+        messages: List of conversation message strings
+    Returns:
+        Dict with:
+        - facts_extracted: number of unique facts found
+        - decisions / corrections / explicits: unique facts per type
+          (these add up to facts_extracted)
+        - stored / rejected_by_gate: number of ingest() calls that returned
+          a non-zero id versus 0
+        - extracted_facts: one dict per unique fact with type, content
+          (first 100 characters), stored flag and memory_id
+    """
+    # De-duplicate on (type, normalized content). Keying on content alone would
+    # discard the second category of a line that is, for example, both a
+    # decision and a correction, even though _classify_line() reports both.
+    seen = set()
+    unique_facts = []
+    for msg in messages:
+        # Split message into lines and classify each
+        for line in msg.split("\n"):
+            for fact_type, content in _classify_line(line):
+                content = content[:_MAX_FACT_LENGTH]
+                key = (fact_type, content.lower().strip())
+                if key in seen:
+                    continue
+                seen.add(key)
+                unique_facts.append((fact_type, content))
+    # Count after de-duplication so the per-type totals agree with
+    # facts_extracted and with the extracted_facts list.
+    counts = {"decision": 0, "correction": 0, "explicit": 0}
+    for fact_type, _ in unique_facts:
+        counts[fact_type] += 1
+    # Store via cognitive.ingest()
+    stored = 0
+    rejected_by_gate = 0
+    extracted_details = []
+    for fact_type, content in unique_facts:
+        # Build tagged content for better retrieval
+        tagged_content = f"[{fact_type.upper()}] {content}"
+        result_id = cognitive.ingest(
+            content=tagged_content,
+            source_type="auto_capture",
+            source_id=f"hook_{fact_type}",
+            source_title=f"Auto-captured {fact_type}",
+            domain="conversation",
+            source="agent_observation",
+            skip_quarantine=False,  # Route through quarantine for safety
+            bypass_gate=False,      # Let prediction error gate filter duplicates
+        )
+        # A result of 0 is counted as rejected; any other value as stored
+        was_stored = result_id != 0
+        if was_stored:
+            stored += 1
+        else:
+            rejected_by_gate += 1
+        extracted_details.append({
+            "type": fact_type,
+            "content": content[:100],
+            "stored": was_stored,
+            "memory_id": result_id,
+        })
+    return {
+        "facts_extracted": len(unique_facts),
+        "decisions": counts["decision"],
+        "corrections": counts["correction"],
+        "explicits": counts["explicit"],
+        "stored": stored,
+        "rejected_by_gate": rejected_by_gate,
+        "extracted_facts": extracted_details,
+    }
+def _read_stdin() -> list[str]:
+    """Return the non-blank lines piped in on stdin (for hook integration).
+    When stdin is an interactive terminal nothing is read and an empty list
+    is returned. Otherwise the whole stream is read, the text as a whole is
+    stripped of leading/trailing whitespace and split on newlines; lines
+    that are empty or whitespace-only are dropped.
+    """
+    if sys.stdin.isatty():
+        return []
+    piped_text = sys.stdin.read().strip()
+    kept = []
+    for candidate in piped_text.split("\n"):
+        if candidate.strip():
+            kept.append(candidate)
+    return kept
+def main():
+    """CLI entry point — messages come from argv, otherwise from piped stdin.
+    Prints a usage hint and exits with status 1 when no messages are given;
+    otherwise runs process_conversation() and prints a summary followed by
+    one line per extracted fact.
+    Usage:
+        echo "We decided to use PostgreSQL" | python3 auto_capture.py
+        python3 auto_capture.py "Remember: always use WAL mode" "That's wrong, fix it"
+    """
+    cli_messages = sys.argv[1:]
+    messages = list(cli_messages) if cli_messages else _read_stdin()
+    if not messages:
+        print("Usage: python3 auto_capture.py 'message1' 'message2' ...")
+        print("   or: echo 'messages' | python3 auto_capture.py")
+        sys.exit(1)
+    summary = process_conversation(messages)
+    # Overall totals first, then the per-fact breakdown
+    print(f"Facts extracted: {summary['facts_extracted']}")
+    print(f"  Decisions: {summary['decisions']}")
+    print(f"  Corrections: {summary['corrections']}")
+    print(f"  Explicits: {summary['explicits']}")
+    print(f"Stored: {summary['stored']}, Rejected by gate: {summary['rejected_by_gate']}")
+    for entry in summary["extracted_facts"]:
+        if entry["stored"]:
+            outcome = "STORED"
+        else:
+            outcome = "REJECTED"
+        print(f"  [{outcome}] [{entry['type']}] {entry['content']}")
+if __name__ == "__main__":
+    main()