superlocalmemory 3.4.0 → 3.4.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +7 -8
- package/docs/screenshots/01-dashboard-main.png +0 -0
- package/docs/screenshots/02-knowledge-graph.png +0 -0
- package/docs/screenshots/03-patterns-learning.png +0 -0
- package/docs/screenshots/04-learning-dashboard.png +0 -0
- package/docs/screenshots/05-behavioral-analysis.png +0 -0
- package/docs/screenshots/06-graph-communities.png +0 -0
- package/package.json +2 -2
- package/pyproject.toml +11 -2
- package/scripts/postinstall.js +26 -7
- package/src/superlocalmemory/cli/commands.py +42 -60
- package/src/superlocalmemory/cli/daemon.py +107 -47
- package/src/superlocalmemory/cli/main.py +10 -0
- package/src/superlocalmemory/cli/setup_wizard.py +137 -9
- package/src/superlocalmemory/core/config.py +28 -0
- package/src/superlocalmemory/core/consolidation_engine.py +38 -1
- package/src/superlocalmemory/core/engine.py +9 -0
- package/src/superlocalmemory/core/engine_wiring.py +5 -1
- package/src/superlocalmemory/core/graph_analyzer.py +254 -12
- package/src/superlocalmemory/core/health_monitor.py +313 -0
- package/src/superlocalmemory/core/reranker_worker.py +19 -5
- package/src/superlocalmemory/ingestion/__init__.py +13 -0
- package/src/superlocalmemory/ingestion/adapter_manager.py +234 -0
- package/src/superlocalmemory/ingestion/base_adapter.py +177 -0
- package/src/superlocalmemory/ingestion/calendar_adapter.py +340 -0
- package/src/superlocalmemory/ingestion/credentials.py +118 -0
- package/src/superlocalmemory/ingestion/gmail_adapter.py +369 -0
- package/src/superlocalmemory/ingestion/parsers.py +100 -0
- package/src/superlocalmemory/ingestion/transcript_adapter.py +156 -0
- package/src/superlocalmemory/learning/consolidation_worker.py +287 -53
- package/src/superlocalmemory/learning/entity_compiler.py +377 -0
- package/src/superlocalmemory/mesh/__init__.py +12 -0
- package/src/superlocalmemory/mesh/broker.py +344 -0
- package/src/superlocalmemory/retrieval/entity_channel.py +141 -4
- package/src/superlocalmemory/retrieval/spreading_activation.py +45 -0
- package/src/superlocalmemory/server/api.py +15 -8
- package/src/superlocalmemory/server/routes/behavioral.py +8 -4
- package/src/superlocalmemory/server/routes/chat.py +320 -0
- package/src/superlocalmemory/server/routes/entity.py +95 -0
- package/src/superlocalmemory/server/routes/ingest.py +110 -0
- package/src/superlocalmemory/server/routes/insights.py +368 -0
- package/src/superlocalmemory/server/routes/learning.py +106 -6
- package/src/superlocalmemory/server/routes/memories.py +20 -9
- package/src/superlocalmemory/server/routes/mesh.py +186 -0
- package/src/superlocalmemory/server/routes/stats.py +25 -3
- package/src/superlocalmemory/server/routes/timeline.py +252 -0
- package/src/superlocalmemory/server/routes/v3_api.py +161 -0
- package/src/superlocalmemory/server/ui.py +8 -0
- package/src/superlocalmemory/server/unified_daemon.py +691 -0
- package/src/superlocalmemory/storage/schema_v343.py +229 -0
- package/src/superlocalmemory/ui/index.html +168 -58
- package/src/superlocalmemory/ui/js/graph-event-bus.js +83 -0
- package/src/superlocalmemory/ui/js/graph-filters.js +1 -1
- package/src/superlocalmemory/ui/js/knowledge-graph.js +942 -0
- package/src/superlocalmemory/ui/js/memory-chat.js +344 -0
- package/src/superlocalmemory/ui/js/memory-timeline.js +265 -0
- package/src/superlocalmemory/ui/js/quick-actions.js +334 -0
- package/src/superlocalmemory.egg-info/PKG-INFO +0 -594
- package/src/superlocalmemory.egg-info/SOURCES.txt +0 -279
- package/src/superlocalmemory.egg-info/dependency_links.txt +0 -1
- package/src/superlocalmemory.egg-info/entry_points.txt +0 -2
- package/src/superlocalmemory.egg-info/requires.txt +0 -47
- package/src/superlocalmemory.egg-info/top_level.txt +0 -1
|
@@ -0,0 +1,320 @@
|
|
|
1
|
+
# Copyright (c) 2026 Varun Pratap Bhardwaj / Qualixar
|
|
2
|
+
# Licensed under AGPL-3.0-or-later — see LICENSE file
|
|
3
|
+
# Part of SuperLocalMemory v3.4.1 | https://qualixar.com
|
|
4
|
+
|
|
5
|
+
"""Ask My Memory — SSE chat endpoint.
|
|
6
|
+
|
|
7
|
+
Flow: query → 6-channel retrieval → format context → LLM stream → SSE
|
|
8
|
+
Mode A: No LLM, returns formatted retrieval results.
|
|
9
|
+
Mode B: Ollama local streaming via /api/chat.
|
|
10
|
+
Mode C: Cloud LLM streaming (OpenAI-compatible).
|
|
11
|
+
|
|
12
|
+
Part of Qualixar | Author: Varun Pratap Bhardwaj
|
|
13
|
+
"""
|
|
14
|
+
|
|
15
|
+
from __future__ import annotations
|
|
16
|
+
|
|
17
|
+
import asyncio
|
|
18
|
+
import json
|
|
19
|
+
import logging
|
|
20
|
+
import re
|
|
21
|
+
from typing import AsyncGenerator
|
|
22
|
+
|
|
23
|
+
import httpx
|
|
24
|
+
from fastapi import APIRouter, Request
|
|
25
|
+
from fastapi.responses import StreamingResponse
|
|
26
|
+
|
|
27
|
+
logger = logging.getLogger(__name__)
|
|
28
|
+
|
|
29
|
+
router = APIRouter(tags=["chat"])
|
|
30
|
+
|
|
31
|
+
# Citation marker pattern: [MEM-1], [MEM-2], etc.
|
|
32
|
+
_CITATION_RE = re.compile(r"\[MEM-(\d+)\]")
|
|
33
|
+
|
|
34
|
+
# System prompt for LLM — instructs citation usage
|
|
35
|
+
_SYSTEM_PROMPT = (
|
|
36
|
+
"You are a memory assistant. Answer the user's question using ONLY the "
|
|
37
|
+
"provided memories. When you use information from a memory, include its "
|
|
38
|
+
"marker inline, e.g. [MEM-1]. If no memories are relevant, say so. "
|
|
39
|
+
"Be concise and factual."
|
|
40
|
+
)
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
# ── SSE Stream Endpoint ─────────────────────────────────────────
|
|
44
|
+
|
|
45
|
+
@router.post("/api/v3/chat/stream")
async def chat_stream(request: Request):
    """Stream a memory-grounded chat response via SSE.

    Body: {"query": "...", "mode": "a"|"b"|"c", "limit": 10}
    Response: text/event-stream with events: token, citation, done, error
    """
    try:
        body = await request.json()
    except Exception:
        return StreamingResponse(
            _sse_error("Invalid JSON body"),
            media_type="text/event-stream",
        )

    query = (body.get("query") or "").strip()
    if not query:
        return StreamingResponse(
            _sse_error("Query is required"),
            media_type="text/event-stream",
        )

    mode = str(body.get("mode") or "a").lower()
    # Coerce limit defensively: a non-numeric "limit" in the body would
    # otherwise raise TypeError in min() and surface as an HTTP 500
    # instead of a well-formed SSE error. Clamp to [1, 20].
    try:
        limit = int(body.get("limit", 10))
    except (TypeError, ValueError):
        limit = 10
    limit = max(1, min(limit, 20))

    return StreamingResponse(
        _stream_chat(query, mode, limit),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "X-Accel-Buffering": "no",  # nginx: disable proxy buffering
            "Content-Encoding": "identity",  # bypass GZipMiddleware
        },
    )
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
# ── Core Chat Logic ──────────────────────────────────────────────
|
|
82
|
+
|
|
83
|
+
async def _stream_chat(
    query: str, mode: str, limit: int,
) -> AsyncGenerator[str, None]:
    """Retrieve memories, then stream the LLM response with citations.

    Emits SSE frames in order: citation* → token* → done. A retrieval
    failure produces an ``error`` event followed by ``done``.
    """
    # Step 1: retrieval is synchronous (WorkerPool); run it in the default
    # executor so the event loop keeps serving other requests meanwhile.
    memories = []
    try:
        # get_running_loop() is the correct call inside a coroutine;
        # get_event_loop() is deprecated here since 3.10 and may create
        # a stray loop when none is running.
        loop = asyncio.get_running_loop()
        memories = await loop.run_in_executor(None, _recall_memories, query, limit)
    except Exception as exc:
        yield _sse_event("error", json.dumps({"message": f"Retrieval failed: {exc}"}))
        yield _sse_event("done", "")
        return

    if not memories:
        yield _sse_event("token", "No relevant memories found for your query.")
        yield _sse_event("done", "")
        return

    # Step 2: send citation metadata up front so the UI can render sources
    # before any answer tokens arrive.
    for i, mem in enumerate(memories):
        citation_data = {
            "index": i + 1,
            "fact_id": mem.get("fact_id", ""),
            "content_preview": (mem.get("content") or "")[:80],
            "trust_score": mem.get("trust_score", 0),
            "score": mem.get("score", 0),
        }
        yield _sse_event("citation", json.dumps(citation_data))

    # Step 3: route to the selected answer mode.
    if mode == "a":
        # Mode A: no LLM — formatted retrieval results only.
        async for event in _stream_mode_a(query, memories):
            yield event
    elif mode in ("b", "c"):
        # Mode B/C: LLM streaming (Ollama local or OpenAI-compatible cloud).
        async for event in _stream_mode_bc(query, memories, mode):
            yield event
    else:
        yield _sse_event("token", "Unknown mode. Use a, b, or c.")

    yield _sse_event("done", "")
|
|
127
|
+
|
|
128
|
+
|
|
129
|
+
# ── Mode A: Raw Retrieval Results ────────────────────────────────
|
|
130
|
+
|
|
131
|
+
async def _stream_mode_a(
    query: str, memories: list,
) -> AsyncGenerator[str, None]:
    """Emit retrieval results as formatted markdown tokens (no LLM).

    Mode A is the zero-cloud path: with no model available, each memory
    is rendered verbatim with its relevance/trust scores. Users wanting
    conversational answers should switch to Mode B (Ollama) or Mode C
    (Cloud) in Settings.
    """
    header_lines = (
        "**Mode A — Raw Memory Retrieval** (no LLM connected)\n",
        "For AI-powered answers, switch to Mode B or C in Settings.\n",
        f"Found **{len(memories)}** relevant memories for: *{query}*\n\n",
    )
    for line in header_lines:
        yield _sse_event("token", line)
    await asyncio.sleep(0.03)

    for idx, mem in enumerate(memories, start=1):
        body = mem.get("content") or mem.get("source_content") or ""
        relevance = mem.get("score", 0)
        trust_val = mem.get("trust_score", 0)
        rendered = (
            f"**[MEM-{idx}]** (relevance: {relevance:.2f}, trust: {trust_val:.2f})\n"
            f"{body}\n\n"
        )
        yield _sse_event("token", rendered)
        await asyncio.sleep(0.03)
|
|
155
|
+
|
|
156
|
+
|
|
157
|
+
# ── Mode B/C: LLM Streaming ─────────────────────────────────────
|
|
158
|
+
|
|
159
|
+
async def _stream_mode_bc(
    query: str, memories: list, mode: str,
) -> AsyncGenerator[str, None]:
    """Stream LLM response with memory context and citation detection.

    Builds a [MEM-n]-tagged context block, loads the configured LLM
    provider, and streams tokens from either Ollama or an
    OpenAI-compatible endpoint. Falls back to Mode A output when no
    provider is configured. Note: the caller (_stream_chat) emits the
    final "done" event, so this generator never does.
    """

    # Build context with citation markers so the model can cite [MEM-n].
    context_parts = []
    for i, mem in enumerate(memories):
        content = mem.get("content") or mem.get("source_content") or ""
        trust = mem.get("trust_score", 0)
        context_parts.append(f"[MEM-{i+1}] {content} (trust: {trust:.2f})")
    context = "\n".join(context_parts)

    messages = [
        {"role": "system", "content": _SYSTEM_PROMPT},
        {"role": "user", "content": f"Memories:\n{context}\n\nQuestion: {query}"},
    ]

    # Load LLM config. NOTE(review): the broad except also swallows
    # import/parse errors and reports them as "LLM not configured" —
    # consider logging the exception for diagnosability.
    try:
        from superlocalmemory.core.config import SLMConfig
        config = SLMConfig.load()
        provider = config.llm.provider or ""
        model = config.llm.model or ""
        api_key = config.llm.api_key or ""
        api_base = config.llm.api_base or ""
    except Exception:
        yield _sse_event("token", "LLM not configured. Use Mode A or configure a provider in Settings.")
        return

    # No provider set: degrade gracefully to Mode A raw results.
    if not provider:
        yield _sse_event("token", "No LLM provider configured. Showing raw results instead.\n\n")
        async for event in _stream_mode_a(query, memories):
            yield event
        return

    # Stream from provider; connection problems and all other errors are
    # reported inline as token text so the SSE stream stays well-formed.
    try:
        if provider == "ollama":
            async for token in _stream_ollama(messages, model, api_base):
                yield _sse_event("token", token)
        else:
            async for token in _stream_openai_compat(
                messages, model, api_key, api_base, provider,
            ):
                yield _sse_event("token", token)
    except httpx.ConnectError:
        yield _sse_event("token", f"\n\n[Connection failed — is {provider} running?]")
    except Exception as exc:
        yield _sse_event("token", f"\n\n[LLM error: {exc}]")
|
|
209
|
+
|
|
210
|
+
|
|
211
|
+
# ── Ollama Streaming (/api/chat with messages) ───────────────────
|
|
212
|
+
|
|
213
|
+
async def _stream_ollama(
    messages: list, model: str, api_base: str,
) -> AsyncGenerator[str, None]:
    """Yield content tokens from Ollama's streaming /api/chat endpoint.

    Falls back to the OLLAMA_HOST env var (default localhost:11434) when
    api_base is empty, and to the "llama3.2" model when none is set.
    """
    import os

    host = api_base or os.environ.get("OLLAMA_HOST", "http://localhost:11434")
    endpoint = f"{host.rstrip('/')}/api/chat"

    request_body = {
        "model": model or "llama3.2",
        "messages": messages,
        "stream": True,
        "options": {"num_predict": 1024, "temperature": 0.3, "num_ctx": 4096},
    }

    async with httpx.AsyncClient(timeout=httpx.Timeout(120.0)) as client:
        async with client.stream("POST", endpoint, json=request_body) as response:
            response.raise_for_status()
            # Ollama streams one JSON object per line; skip blanks and
            # anything that fails to parse, stop at the terminal chunk.
            async for raw_line in response.aiter_lines():
                if not raw_line:
                    continue
                try:
                    parsed = json.loads(raw_line)
                except json.JSONDecodeError:
                    continue
                if parsed.get("done"):
                    break
                piece = parsed.get("message", {}).get("content", "")
                if piece:
                    yield piece
|
|
243
|
+
|
|
244
|
+
|
|
245
|
+
# ── OpenAI-Compatible Streaming ──────────────────────────────────
|
|
246
|
+
|
|
247
|
+
async def _stream_openai_compat(
    messages: list, model: str, api_key: str,
    api_base: str, provider: str,
) -> AsyncGenerator[str, None]:
    """Stream tokens from OpenAI-compatible API (OpenAI, Azure, OpenRouter).

    Selects URL + auth headers per provider, then parses the standard
    ``data: {...}`` / ``data: [DONE]`` chat-completions stream format.
    """
    import os  # NOTE(review): unused in this function — candidate for removal

    if provider == "azure":
        url = api_base  # Azure uses full deployment URL
        headers = {"api-key": api_key, "Content-Type": "application/json"}
    elif provider == "openrouter":
        url = api_base or "https://openrouter.ai/api/v1/chat/completions"
        headers = {"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"}
    elif provider == "anthropic":
        # Anthropic uses a different streaming format — simplified here
        # NOTE(review): the payload and the "choices/delta" parsing below are
        # OpenAI-shaped; Anthropic's /v1/messages streams typed events
        # (content_block_delta etc.), so this branch likely yields nothing —
        # verify against the Anthropic streaming docs before relying on it.
        url = api_base or "https://api.anthropic.com/v1/messages"
        headers = {
            "x-api-key": api_key,
            "anthropic-version": "2023-06-01",
            "Content-Type": "application/json",
        }
    else:
        url = api_base or "https://api.openai.com/v1/chat/completions"
        headers = {"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"}

    payload = {
        "model": model,
        "messages": messages,
        "stream": True,
        "max_tokens": 1024,
        "temperature": 0.3,
    }

    async with httpx.AsyncClient(timeout=httpx.Timeout(120.0)) as client:
        async with client.stream("POST", url, json=payload, headers=headers) as resp:
            resp.raise_for_status()
            # Standard SSE chat-completions stream: only "data: " lines
            # matter; "[DONE]" terminates; malformed chunks are skipped.
            async for line in resp.aiter_lines():
                if not line.startswith("data: "):
                    continue
                data = line[6:]
                if data == "[DONE]":
                    break
                try:
                    chunk = json.loads(data)
                    token = chunk.get("choices", [{}])[0].get("delta", {}).get("content", "")
                    if token:
                        yield token
                except json.JSONDecodeError:
                    continue
|
|
296
|
+
|
|
297
|
+
|
|
298
|
+
# ── Retrieval Helper ─────────────────────────────────────────────
|
|
299
|
+
|
|
300
|
+
def _recall_memories(query: str, limit: int) -> list:
    """Run 6-channel retrieval via WorkerPool (synchronous, runs in executor)."""
    from superlocalmemory.core.worker_pool import WorkerPool

    response = WorkerPool.shared().recall(query, limit=limit)
    return response.get("results", []) if response.get("ok") else []
|
|
308
|
+
|
|
309
|
+
|
|
310
|
+
# ── SSE Formatting ───────────────────────────────────────────────
|
|
311
|
+
|
|
312
|
+
def _sse_event(event_type: str, data: str) -> str:
|
|
313
|
+
"""Format a single SSE event."""
|
|
314
|
+
return f"event: {event_type}\ndata: {data}\n\n"
|
|
315
|
+
|
|
316
|
+
|
|
317
|
+
async def _sse_error(message: str) -> AsyncGenerator[str, None]:
    """Yield a single SSE error event, then the terminating done event."""
    payload = json.dumps({"message": message})
    for frame in (_sse_event("error", payload), _sse_event("done", "")):
        yield frame
|
|
@@ -0,0 +1,95 @@
|
|
|
1
|
+
# Copyright (c) 2026 Varun Pratap Bhardwaj / Qualixar
|
|
2
|
+
# Licensed under the Elastic License 2.0 - see LICENSE file
|
|
3
|
+
# Part of SuperLocalMemory V3 | https://qualixar.com | https://varunpratap.com
|
|
4
|
+
|
|
5
|
+
"""Entity compilation API routes — view and recompile entity summaries."""
|
|
6
|
+
|
|
7
|
+
from __future__ import annotations
|
|
8
|
+
|
|
9
|
+
from fastapi import APIRouter, HTTPException, Request, Query
|
|
10
|
+
|
|
11
|
+
router = APIRouter(prefix="/api/entity", tags=["entity"])
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
@router.get("/{entity_name}")
async def get_entity(
    entity_name: str,
    request: Request,
    profile: str = Query(default="default"),
    project: str = Query(default=""),
):
    """Get compiled truth + timeline for an entity.

    Resolves the entity case-insensitively by canonical name within the
    given profile/project scope and returns its compiled profile fields.

    Raises:
        HTTPException 503: engine not yet initialized on app state.
        HTTPException 404: no matching entity profile row.
    """
    engine = request.app.state.engine
    if engine is None:
        raise HTTPException(503, detail="Engine not initialized")

    # NOTE(review): synchronous sqlite3 access inside an async handler
    # blocks the event loop for the duration of the query — fine for a
    # small indexed lookup, but worth confirming under load.
    import sqlite3
    import json
    conn = sqlite3.connect(str(engine._config.db_path))
    conn.row_factory = sqlite3.Row  # allows row["column"] access below
    try:
        # Search by canonical_name (case-insensitive)
        row = conn.execute("""
            SELECT ep.compiled_truth, ep.timeline, ep.fact_ids_json,
                   ep.last_compiled_at, ep.compilation_confidence,
                   ep.knowledge_summary, ce.entity_type
            FROM entity_profiles ep
            JOIN canonical_entities ce ON ep.entity_id = ce.entity_id
            WHERE LOWER(ce.canonical_name) = LOWER(?)
              AND ep.profile_id = ?
              AND ep.project_name = ?
        """, (entity_name, profile, project)).fetchone()

        if not row:
            raise HTTPException(404, detail=f"Entity '{entity_name}' not found")

        # JSON columns may be NULL/empty — decode defensively to [].
        return {
            "entity_name": entity_name,
            "entity_type": row["entity_type"],
            "compiled_truth": row["compiled_truth"] or "",
            "knowledge_summary": row["knowledge_summary"] or "",
            "timeline": json.loads(row["timeline"]) if row["timeline"] else [],
            "source_fact_ids": json.loads(row["fact_ids_json"]) if row["fact_ids_json"] else [],
            "last_compiled_at": row["last_compiled_at"],
            "confidence": row["compilation_confidence"],
        }
    finally:
        conn.close()
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
@router.post("/{entity_name}/recompile")
async def recompile_entity(
    entity_name: str,
    request: Request,
    profile: str = Query(default="default"),
    project: str = Query(default=""),
):
    """Force immediate recompilation of an entity.

    Resolves the entity case-insensitively by canonical name within the
    profile, then runs EntityCompiler synchronously against the same DB.

    Raises:
        HTTPException 503: engine not yet initialized on app state.
        HTTPException 404: entity not found in this profile.
    """
    engine = request.app.state.engine
    if engine is None:
        raise HTTPException(503, detail="Engine not initialized")

    import sqlite3
    conn = sqlite3.connect(str(engine._config.db_path))
    conn.row_factory = sqlite3.Row
    try:
        entity = conn.execute(
            "SELECT entity_id, canonical_name, entity_type FROM canonical_entities "
            "WHERE LOWER(canonical_name) = LOWER(?) AND profile_id = ?",
            (entity_name, profile),
        ).fetchone()
    finally:
        # Close BEFORE compiling: EntityCompiler opens its own connection
        # to the same database, and holding this read connection open for
        # the (potentially long) compile invites SQLITE_BUSY contention.
        conn.close()

    if not entity:
        raise HTTPException(404, detail=f"Entity '{entity_name}' not found")

    from superlocalmemory.learning.entity_compiler import EntityCompiler
    compiler = EntityCompiler(str(engine._config.db_path), engine._config)
    result = compiler.compile_entity(
        profile, project, entity["entity_id"], entity["canonical_name"],
    )

    if result:
        return {"ok": True, **result}
    return {"ok": False, "reason": "no facts to compile"}
|
|
@@ -0,0 +1,110 @@
|
|
|
1
|
+
# Copyright (c) 2026 Varun Pratap Bhardwaj / Qualixar
|
|
2
|
+
# Licensed under the Elastic License 2.0 - see LICENSE file
|
|
3
|
+
# Part of SuperLocalMemory V3 | https://qualixar.com | https://varunpratap.com
|
|
4
|
+
|
|
5
|
+
"""Ingestion endpoint — accepts data from external adapters.
|
|
6
|
+
|
|
7
|
+
POST /ingest with {content, source_type, dedup_key, metadata}.
|
|
8
|
+
Deduplicates by source_type + dedup_key. Stores via MemoryEngine.
|
|
9
|
+
Admission control: max 10 concurrent ingestions (HTTP 429 on overflow).
|
|
10
|
+
|
|
11
|
+
Part of Qualixar | Author: Varun Pratap Bhardwaj
|
|
12
|
+
"""
|
|
13
|
+
|
|
14
|
+
from __future__ import annotations
|
|
15
|
+
|
|
16
|
+
import json
|
|
17
|
+
import sqlite3
|
|
18
|
+
import threading
|
|
19
|
+
from datetime import datetime, timezone
|
|
20
|
+
|
|
21
|
+
from fastapi import APIRouter, HTTPException, Request
|
|
22
|
+
from pydantic import BaseModel
|
|
23
|
+
|
|
24
|
+
router = APIRouter(tags=["ingestion"])
|
|
25
|
+
|
|
26
|
+
_MAX_CONCURRENT = 10
|
|
27
|
+
_active_count = 0
|
|
28
|
+
_active_lock = threading.Lock()
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
class IngestRequest(BaseModel):
    """Payload accepted by POST /ingest from external adapters."""

    # Raw text to store as one or more memory facts.
    content: str
    # Adapter identifier (e.g. "gmail", "calendar"); half of the dedup key.
    source_type: str
    # Stable per-item key; (source_type, dedup_key) dedupes re-ingestion.
    dedup_key: str
    # Adapter-specific extras merged into the stored metadata. Pydantic
    # deep-copies field defaults per instance, so the mutable {} default
    # is safe here (unlike a plain-function default argument).
    metadata: dict = {}
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
@router.post("/ingest")
async def ingest(req: IngestRequest, request: Request):
    """Ingest content from an external adapter.

    Deduplicates by (source_type, dedup_key). Returns 429 if too many
    concurrent ingestions. Stores via the singleton MemoryEngine.

    The sqlite + engine.store pipeline is synchronous, so it is pushed to
    a worker thread via asyncio.to_thread; previously it ran inline and
    blocked the event loop for the entire ingestion.

    Raises:
        HTTPException 503: engine not initialized.
        HTTPException 400: missing content / source_type / dedup_key.
        HTTPException 429: admission-control limit reached.
        HTTPException 500: any failure inside the ingestion pipeline.
    """
    import asyncio

    global _active_count

    engine = request.app.state.engine
    if engine is None:
        raise HTTPException(503, detail="Engine not initialized")

    if not req.content:
        raise HTTPException(400, detail="content required")
    if not req.source_type:
        raise HTTPException(400, detail="source_type required")
    if not req.dedup_key:
        raise HTTPException(400, detail="dedup_key required")

    # Admission control: cap concurrent ingestions at _MAX_CONCURRENT.
    # The counter is only incremented once we are committed to running,
    # so the 429 path never needs a matching decrement.
    with _active_lock:
        if _active_count >= _MAX_CONCURRENT:
            raise HTTPException(
                429,
                detail="Too many concurrent ingestions",
                headers={"Retry-After": "5"},
            )
        _active_count += 1

    try:
        # Run the blocking pipeline off the event loop.
        return await asyncio.to_thread(_ingest_sync, engine, req)
    except Exception as exc:
        raise HTTPException(500, detail=str(exc))
    finally:
        with _active_lock:
            _active_count -= 1


def _ingest_sync(engine, req: IngestRequest) -> dict:
    """Synchronous ingestion pipeline: dedup check → store → log."""
    db_path = str(engine._config.db_path)

    # Dedup check. NOTE(review): check-then-store is not atomic — two
    # concurrent identical submissions may both pass this check and store
    # twice; the INSERT OR IGNORE below keeps the log itself consistent.
    conn = sqlite3.connect(db_path)
    try:
        existing = conn.execute(
            "SELECT id FROM ingestion_log WHERE source_type=? AND dedup_key=?",
            (req.source_type, req.dedup_key),
        ).fetchone()
        if existing:
            return {"ingested": False, "reason": "already_ingested"}
    finally:
        conn.close()

    # Store via engine; source_type is folded into the fact metadata.
    metadata = {**req.metadata, "source_type": req.source_type}
    fact_ids = engine.store(req.content, metadata=metadata)

    # Record in ingestion_log so future submissions are deduplicated.
    conn = sqlite3.connect(db_path)
    try:
        conn.execute(
            "INSERT OR IGNORE INTO ingestion_log "
            "(source_type, dedup_key, fact_ids, metadata, status, ingested_at) "
            "VALUES (?, ?, ?, ?, 'ingested', ?)",
            (
                req.source_type,
                req.dedup_key,
                json.dumps(fact_ids),
                json.dumps(req.metadata),
                datetime.now(timezone.utc).isoformat(),
            ),
        )
        conn.commit()
    finally:
        conn.close()

    return {"ingested": True, "fact_ids": fact_ids}
|