npm - superlocalmemory - Versions diffs - 3.4.0 → 3.4.3 - Mend

superlocalmemory 3.4.0 → 3.4.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (63)

package/README.md +7 -8
package/docs/screenshots/01-dashboard-main.png +0 -0
package/docs/screenshots/02-knowledge-graph.png +0 -0
package/docs/screenshots/03-patterns-learning.png +0 -0
package/docs/screenshots/04-learning-dashboard.png +0 -0
package/docs/screenshots/05-behavioral-analysis.png +0 -0
package/docs/screenshots/06-graph-communities.png +0 -0
package/package.json +2 -2
package/pyproject.toml +11 -2
package/scripts/postinstall.js +26 -7
package/src/superlocalmemory/cli/commands.py +42 -60
package/src/superlocalmemory/cli/daemon.py +107 -47
package/src/superlocalmemory/cli/main.py +10 -0
package/src/superlocalmemory/cli/setup_wizard.py +137 -9
package/src/superlocalmemory/core/config.py +28 -0
package/src/superlocalmemory/core/consolidation_engine.py +38 -1
package/src/superlocalmemory/core/engine.py +9 -0
package/src/superlocalmemory/core/engine_wiring.py +5 -1
package/src/superlocalmemory/core/graph_analyzer.py +254 -12
package/src/superlocalmemory/core/health_monitor.py +313 -0
package/src/superlocalmemory/core/reranker_worker.py +19 -5
package/src/superlocalmemory/ingestion/__init__.py +13 -0
package/src/superlocalmemory/ingestion/adapter_manager.py +234 -0
package/src/superlocalmemory/ingestion/base_adapter.py +177 -0
package/src/superlocalmemory/ingestion/calendar_adapter.py +340 -0
package/src/superlocalmemory/ingestion/credentials.py +118 -0
package/src/superlocalmemory/ingestion/gmail_adapter.py +369 -0
package/src/superlocalmemory/ingestion/parsers.py +100 -0
package/src/superlocalmemory/ingestion/transcript_adapter.py +156 -0
package/src/superlocalmemory/learning/consolidation_worker.py +287 -53
package/src/superlocalmemory/learning/entity_compiler.py +377 -0
package/src/superlocalmemory/mesh/__init__.py +12 -0
package/src/superlocalmemory/mesh/broker.py +344 -0
package/src/superlocalmemory/retrieval/entity_channel.py +141 -4
package/src/superlocalmemory/retrieval/spreading_activation.py +45 -0
package/src/superlocalmemory/server/api.py +15 -8
package/src/superlocalmemory/server/routes/behavioral.py +8 -4
package/src/superlocalmemory/server/routes/chat.py +320 -0
package/src/superlocalmemory/server/routes/entity.py +95 -0
package/src/superlocalmemory/server/routes/ingest.py +110 -0
package/src/superlocalmemory/server/routes/insights.py +368 -0
package/src/superlocalmemory/server/routes/learning.py +106 -6
package/src/superlocalmemory/server/routes/memories.py +20 -9
package/src/superlocalmemory/server/routes/mesh.py +186 -0
package/src/superlocalmemory/server/routes/stats.py +25 -3
package/src/superlocalmemory/server/routes/timeline.py +252 -0
package/src/superlocalmemory/server/routes/v3_api.py +161 -0
package/src/superlocalmemory/server/ui.py +8 -0
package/src/superlocalmemory/server/unified_daemon.py +691 -0
package/src/superlocalmemory/storage/schema_v343.py +229 -0
package/src/superlocalmemory/ui/index.html +168 -58
package/src/superlocalmemory/ui/js/graph-event-bus.js +83 -0
package/src/superlocalmemory/ui/js/graph-filters.js +1 -1
package/src/superlocalmemory/ui/js/knowledge-graph.js +942 -0
package/src/superlocalmemory/ui/js/memory-chat.js +344 -0
package/src/superlocalmemory/ui/js/memory-timeline.js +265 -0
package/src/superlocalmemory/ui/js/quick-actions.js +334 -0
package/src/superlocalmemory.egg-info/PKG-INFO +0 -594
package/src/superlocalmemory.egg-info/SOURCES.txt +0 -279
package/src/superlocalmemory.egg-info/dependency_links.txt +0 -1
package/src/superlocalmemory.egg-info/entry_points.txt +0 -2
package/src/superlocalmemory.egg-info/requires.txt +0 -47
package/src/superlocalmemory.egg-info/top_level.txt +0 -1

package/src/superlocalmemory/learning/consolidation_worker.py CHANGED

@@ -73,7 +73,38 @@ class ConsolidationWorker:
         except Exception as exc:
             logger.debug("Pattern generation failed: %s", exc)
-        # 4. Check if ranker should retrain
+        # 4. Recompute graph intelligence (v3.4.2: wired into learning pipeline)
+        try:
+            from superlocalmemory.core.graph_analyzer import GraphAnalyzer
+            conn_ga = sqlite3.connect(self._memory_db, timeout=10)
+            conn_ga.execute("PRAGMA busy_timeout=5000")
+            conn_ga.row_factory = sqlite3.Row
+            class _DBProxy:
+                """Minimal DB proxy for GraphAnalyzer compatibility."""
+                def __init__(self, connection: sqlite3.Connection) -> None:
+                    self._conn = connection
+                def execute(self, sql: str, params: tuple = ()) -> list:
+                    cursor = self._conn.execute(sql, params)
+                    if sql.strip().upper().startswith(("INSERT", "UPDATE", "DELETE", "ALTER", "CREATE")):
+                        self._conn.commit()
+                        return []
+                    return cursor.fetchall()
+            ga = GraphAnalyzer(_DBProxy(conn_ga))
+            if not dry_run:
+                ga_result = ga.compute_and_store(profile_id)
+                stats["graph_nodes"] = ga_result.get("node_count", 0)
+                stats["graph_communities"] = ga_result.get("community_count", 0)
+                logger.info(
+                    "Graph analysis: %d nodes, %d communities",
+                    stats["graph_nodes"], stats["graph_communities"],
+                )
+            conn_ga.close()
+        except Exception as exc:
+            logger.debug("Graph analysis failed: %s", exc)
+        # 5. Check if ranker should retrain
         try:
             from superlocalmemory.learning.feedback import FeedbackCollector
             collector = FeedbackCollector(Path(self._learning_db))
@@ -88,6 +119,21 @@ class ConsolidationWorker:
         except Exception as exc:
             logger.debug("Retrain check failed: %s", exc)
+        # 6. Entity compilation (v3.4.3: compiled truth per entity)
+        if not dry_run:
+            try:
+                from superlocalmemory.learning.entity_compiler import EntityCompiler
+                from superlocalmemory.core.config import SLMConfig
+                config = SLMConfig.load()
+                compiler = EntityCompiler(self._memory_db, config)
+                ec_result = compiler.compile_all(profile_id)
+                stats["entities_compiled"] = ec_result.get("compiled", 0)
+                if ec_result["compiled"] > 0:
+                    logger.info("Entity compilation: %d entities compiled",
+                                ec_result["compiled"])
+            except Exception as exc:
+                logger.debug("Entity compilation failed: %s", exc)
         return stats
     def _deduplicate(self, profile_id: str, dry_run: bool) -> int:
@@ -133,127 +179,315 @@ class ConsolidationWorker:
             return 0
     def _generate_patterns(self, profile_id: str, dry_run: bool) -> int:
-        """Mine behavioral patterns from existing memories.
+        """Mine behavioral patterns from ALL memory sources.
-        Scans all facts to detect:
-        - Tech preferences (language/framework mentions)
-        - Topic clusters (frequently discussed subjects)
-        - Temporal patterns (time-of-day activity)
+        v3.4.1: Expanded from 3 to 7 pattern types. No 500-fact cap.
+        Analyzes: facts, signals, co-retrieval edges, channel credits,
+        entities, sessions, graph communities.
         """
         try:
             from superlocalmemory.learning.behavioral import BehavioralPatternStore
             import re
-            from collections import Counter
+            from collections import Counter, defaultdict
             conn = sqlite3.connect(self._memory_db, timeout=10)
             conn.execute("PRAGMA busy_timeout=5000")
             conn.row_factory = sqlite3.Row
+            # v3.4.1: No cap — analyze ALL facts
             facts = conn.execute(
-                "SELECT content, created_at FROM atomic_facts "
-                "WHERE profile_id = ? ORDER BY created_at DESC LIMIT 500",
+                "SELECT fact_id, content, fact_type, created_at, session_id, "
+                "confidence, canonical_entities_json "
+                "FROM atomic_facts "
+                "WHERE profile_id = ? AND lifecycle = 'active' "
+                "ORDER BY created_at DESC",
                 (profile_id,),
             ).fetchall()
-            conn.close()
-            if len(facts) < 10:
+            if len(facts) < 5:
+                conn.close()
                 return 0
             store = BehavioralPatternStore(self._learning_db)
             generated = 0
-            # Tech preferences: detect technology mentions
+            # ── 1. Tech Preferences (expanded keyword list) ───────────
             tech_keywords = {
-                "python": "Python", "javascript": "JavaScript", "typescript": "TypeScript",
-                "react": "React", "vue": "Vue", "angular": "Angular",
-                "postgresql": "PostgreSQL", "mysql": "MySQL", "sqlite": "SQLite",
-                "docker": "Docker", "kubernetes": "Kubernetes", "aws": "AWS",
-                "azure": "Azure", "gcp": "GCP", "node": "Node.js",
-                "fastapi": "FastAPI", "django": "Django", "flask": "Flask",
+                "python": "Python", "javascript": "JavaScript",
+                "typescript": "TypeScript", "react": "React",
+                "vue": "Vue", "angular": "Angular",
+                "postgresql": "PostgreSQL", "mysql": "MySQL",
+                "sqlite": "SQLite", "docker": "Docker",
+                "kubernetes": "Kubernetes", "aws": "AWS",
+                "azure": "Azure", "gcp": "GCP",
+                "node": "Node.js", "fastapi": "FastAPI",
+                "django": "Django", "flask": "Flask",
                 "rust": "Rust", "go": "Go", "java": "Java",
                 "git": "Git", "npm": "npm", "pip": "pip",
-                "langchain": "LangChain", "ollama": "Ollama", "pytorch": "PyTorch",
-                "claude": "Claude", "openai": "OpenAI", "anthropic": "Anthropic",
+                "langchain": "LangChain", "ollama": "Ollama",
+                "pytorch": "PyTorch", "claude": "Claude",
+                "openai": "OpenAI", "anthropic": "Anthropic",
+                "redis": "Redis", "mongodb": "MongoDB",
+                "graphql": "GraphQL", "nextjs": "Next.js",
+                "terraform": "Terraform", "nginx": "Nginx",
+                "linux": "Linux", "macos": "macOS",
+                "vscode": "VS Code", "neovim": "Neovim",
             }
-            tech_counts = Counter()
+            tech_counts: Counter = Counter()
             for f in facts:
                 content = dict(f)["content"].lower()
                 for keyword, label in tech_keywords.items():
                     if keyword in content:
                         tech_counts[label] += 1
-            for tech, count in tech_counts.most_common(15):
-                if count >= 3 and not dry_run:
-                    confidence = min(1.0, count / 20)
+            for tech, count in tech_counts.most_common(20):
+                if count >= 2 and not dry_run:
+                    confidence = min(1.0, count / max(len(facts) * 0.1, 10))
                     store.record_pattern(
                         profile_id=profile_id,
                         pattern_type="tech_preference",
-                        data={"topic": tech, "pattern_key": tech, "value": tech,
-                               "key": "tech", "evidence": count},
+                        data={"topic": tech, "pattern_key": tech,
+                              "value": tech, "key": "tech",
+                              "evidence": count},
                         success_rate=confidence,
                         confidence=confidence,
                     )
                     generated += 1
-            # Topic clusters: most discussed subjects
-            word_counts = Counter()
+            # ── 2. Topic Interests (word frequency) ───────────────────
             stopwords = frozenset({
-                "the", "is", "a", "an", "in", "on", "at", "to", "for", "of",
-                "and", "or", "not", "with", "that", "this", "was", "are", "be",
-                "has", "had", "have", "from", "by", "it", "its", "as", "but",
+                "the", "is", "a", "an", "in", "on", "at", "to", "for",
+                "of", "and", "or", "not", "with", "that", "this", "was",
+                "are", "be", "has", "had", "have", "from", "by", "it",
+                "its", "as", "but", "were", "been", "being", "would",
+                "could", "should", "will", "may", "might", "can", "do",
+                "does", "did", "about", "into", "over", "after", "before",
+                "then", "than", "also", "just", "like", "more", "some",
+                "only", "other", "such", "each", "every", "both", "most",
             })
+            word_counts: Counter = Counter()
             for f in facts:
                 words = re.findall(r'\b[a-zA-Z]{4,}\b', dict(f)["content"].lower())
                 for w in words:
                     if w not in stopwords:
                         word_counts[w] += 1
-            for topic, count in word_counts.most_common(10):
-                if count >= 5 and not dry_run:
-                    confidence = min(1.0, count / 30)
+            for topic, count in word_counts.most_common(15):
+                if count >= 3 and not dry_run:
+                    confidence = min(1.0, count / max(len(facts) * 0.05, 15))
                     store.record_pattern(
                         profile_id=profile_id,
                         pattern_type="interest",
                         data={"topic": topic, "pattern_key": topic,
-                               "count": count, "evidence": count},
+                              "count": count, "evidence": count},
                         success_rate=confidence,
                         confidence=confidence,
                     )
                     generated += 1
-            # Temporal patterns: time-of-day activity
-            hour_counts = Counter()
+            # ── 3. Temporal Activity Patterns ─────────────────────────
+            hour_counts: Counter = Counter()
             for f in facts:
                 created = dict(f).get("created_at", "")
-                if "T" in created:
-                    try:
+                try:
+                    if "T" in created:
                         hour = int(created.split("T")[1][:2])
-                        period = "morning" if 6 <= hour < 12 else (
-                            "afternoon" if 12 <= hour < 18 else (
-                                "evening" if 18 <= hour < 22 else "night"))
-                        hour_counts[period] += 1
-                    except (ValueError, IndexError):
-                        pass
+                    elif " " in created:
+                        hour = int(created.split(" ")[1][:2])
+                    else:
+                        continue
+                    period = ("morning" if 6 <= hour < 12 else
+                              "afternoon" if 12 <= hour < 18 else
+                              "evening" if 18 <= hour < 22 else "night")
+                    hour_counts[period] += 1
+                except (ValueError, IndexError):
+                    pass
+            total_hours = sum(hour_counts.values())
             for period, count in hour_counts.most_common():
-                if count >= 3 and not dry_run:
-                    total = sum(hour_counts.values())
-                    pct = round(count / total * 100)
+                if count >= 2 and total_hours > 0 and not dry_run:
+                    pct = round(count / total_hours * 100)
                     store.record_pattern(
                         profile_id=profile_id,
                         pattern_type="temporal",
                         data={"topic": period, "pattern_key": period,
-                               "value": f"{period} ({pct}%)", "evidence": count,
-                               "key": period, "distribution": dict(hour_counts)},
+                              "value": f"{period} ({pct}%)",
+                              "evidence": count, "key": period,
+                              "distribution": dict(hour_counts)},
                         success_rate=pct / 100,
-                        confidence=min(1.0, count / 20),
+                        confidence=min(1.0, count / max(total_hours * 0.1, 5)),
+                    )
+                    generated += 1
+            # ── 4. Entity Preferences (v3.4.1 NEW) ───────────────────
+            import json as _json
+            entity_counts: Counter = Counter()
+            for f in facts:
+                raw = dict(f).get("canonical_entities_json", "")
+                if raw:
+                    try:
+                        for ent in _json.loads(raw):
+                            entity_counts[ent] += 1
+                    except (ValueError, TypeError):
+                        pass
+            for entity, count in entity_counts.most_common(15):
+                if count >= 3 and not dry_run:
+                    confidence = min(1.0, count / max(len(facts) * 0.05, 10))
+                    store.record_pattern(
+                        profile_id=profile_id,
+                        pattern_type="interest",
+                        data={"topic": entity, "pattern_key": f"entity:{entity}",
+                              "value": entity, "evidence": count,
+                              "source": "entity_frequency"},
+                        success_rate=confidence,
+                        confidence=confidence,
+                    )
+                    generated += 1
+            # ── 5. Session Activity Patterns (v3.4.1 NEW) ────────────
+            session_counts: Counter = Counter()
+            for f in facts:
+                sid = dict(f).get("session_id", "")
+                if sid:
+                    session_counts[sid] += 1
+            if session_counts:
+                avg_facts_per_session = sum(session_counts.values()) / len(session_counts)
+                heavy_sessions = [s for s, c in session_counts.items() if c > avg_facts_per_session * 2]
+                if heavy_sessions and not dry_run:
+                    store.record_pattern(
+                        profile_id=profile_id,
+                        pattern_type="workflow",
+                        data={"pattern_key": "heavy_session_usage",
+                              "value": f"{len(heavy_sessions)} intensive sessions",
+                              "evidence": len(heavy_sessions),
+                              "avg_facts": round(avg_facts_per_session, 1),
+                              "total_sessions": len(session_counts)},
+                        success_rate=0.8,
+                        confidence=min(1.0, len(heavy_sessions) / 5),
+                    )
+                    generated += 1
+            # ── 6. Fact Type Distribution (v3.4.1 NEW) ────────────────
+            type_counts: Counter = Counter()
+            for f in facts:
+                ft = dict(f).get("fact_type", "semantic")
+                type_counts[ft] += 1
+            total_ft = sum(type_counts.values())
+            if total_ft > 0 and not dry_run:
+                dominant_type = type_counts.most_common(1)[0]
+                pct = round(dominant_type[1] / total_ft * 100)
+                store.record_pattern(
+                    profile_id=profile_id,
+                    pattern_type="style",
+                    data={"pattern_key": "memory_style",
+                          "value": f"{dominant_type[0]} dominant ({pct}%)",
+                          "evidence": dominant_type[1],
+                          "distribution": dict(type_counts)},
+                    success_rate=pct / 100,
+                    confidence=min(1.0, dominant_type[1] / 20),
+                )
+                generated += 1
+            # ── 7. Channel Performance (v3.4.1 NEW — from signals) ────
+            try:
+                learn_conn = sqlite3.connect(self._learning_db, timeout=10)
+                learn_conn.row_factory = sqlite3.Row
+                # Retrieval usage patterns from learning_feedback
+                channel_rows = learn_conn.execute(
+                    "SELECT channel, COUNT(*) AS cnt, "
+                    "AVG(signal_value) AS avg_signal "
+                    "FROM learning_feedback "
+                    "WHERE profile_id = ? "
+                    "GROUP BY channel ORDER BY cnt DESC",
+                    (profile_id,),
+                ).fetchall()
+                for row in channel_rows:
+                    d = dict(row)
+                    ch = d.get("channel", "unknown")
+                    cnt = d.get("cnt", 0)
+                    avg_sig = round(float(d.get("avg_signal", 0) or 0), 3)
+                    if cnt >= 5 and not dry_run:
+                        store.record_pattern(
+                            profile_id=profile_id,
+                            pattern_type="style",
+                            data={"pattern_key": f"channel:{ch}",
+                                  "value": f"{ch} ({cnt} hits, {avg_sig} avg)",
+                                  "evidence": cnt,
+                                  "avg_signal": avg_sig},
+                            success_rate=avg_sig,
+                            confidence=min(1.0, cnt / 50),
+                        )
+                        generated += 1
+                # Co-retrieval cluster patterns
+                try:
+                    coret_rows = learn_conn.execute(
+                        "SELECT fact_a, fact_b, co_access_count "
+                        "FROM co_retrieval_edges "
+                        "WHERE profile_id = ? AND co_access_count >= 3 "
+                        "ORDER BY co_access_count DESC LIMIT 20",
+                        (profile_id,),
+                    ).fetchall()
+                    if coret_rows and not dry_run:
+                        store.record_pattern(
+                            profile_id=profile_id,
+                            pattern_type="workflow",
+                            data={"pattern_key": "co_retrieval_clusters",
+                                  "value": f"{len(coret_rows)} strong fact pairs",
+                                  "evidence": len(coret_rows),
+                                  "top_pair_count": dict(coret_rows[0]).get("co_access_count", 0) if coret_rows else 0},
+                            success_rate=0.7,
+                            confidence=min(1.0, len(coret_rows) / 10),
+                        )
+                        generated += 1
+                except Exception:
+                    pass
+                learn_conn.close()
+            except Exception as exc:
+                logger.debug("Signal pattern mining failed: %s", exc)
+            # ── 8. Community Membership (v3.4.1 NEW — from graph) ─────
+            try:
+                comm_rows = conn.execute(
+                    "SELECT community_id, COUNT(*) AS cnt "
+                    "FROM fact_importance "
+                    "WHERE profile_id = ? AND community_id IS NOT NULL "
+                    "GROUP BY community_id ORDER BY cnt DESC",
+                    (profile_id,),
+                ).fetchall()
+                if comm_rows and not dry_run:
+                    total_comm = sum(dict(r)["cnt"] for r in comm_rows)
+                    store.record_pattern(
+                        profile_id=profile_id,
+                        pattern_type="style",
+                        data={"pattern_key": "knowledge_structure",
+                              "value": f"{len(comm_rows)} topic communities, {total_comm} classified facts",
+                              "evidence": total_comm,
+                              "community_count": len(comm_rows)},
+                        success_rate=0.8,
+                        confidence=min(1.0, len(comm_rows) / 5),
                     )
                     generated += 1
+            except Exception:
+                pass
+            conn.close()
+            logger.info(
+                "Pattern mining: %d patterns generated for profile %s "
+                "from %d facts",
+                generated, profile_id, len(facts),
+            )
             return generated
         except Exception as exc:
-            logger.debug("Pattern generation error: %s", exc)
+            logger.warning("Pattern generation error: %s", exc)
             return 0
     def _retrain_ranker(self, profile_id: str, signal_count: int) -> bool: