cortex-mem 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cortex/__init__.py ADDED
File without changes
cortex/db.py ADDED
@@ -0,0 +1,135 @@
1
+ """
2
+ SQLite metadata store for Cortex tiered documents.
3
+ Thread-safe, async-compatible via aiosqlite.
4
+ """
5
+ import json
6
+ import sqlite3
7
+ import uuid
8
+ from pathlib import Path
9
+ from typing import Any, Dict, List, Optional
10
+
11
+ DB_PATH = Path(__file__).parent.parent / "index" / "cortex_tiers.db"
12
+ SCHEMA_PATH = Path(__file__).parent / "schema.sql"
13
+
14
+
15
def _get_conn(db_path: Path = DB_PATH) -> sqlite3.Connection:
    """Open a SQLite connection to *db_path*, creating parent dirs as needed.

    The connection is configured with a Row factory (dict-like column
    access), WAL journaling (better concurrent read behavior), and
    enforced foreign keys.
    """
    # Make sure the containing directory exists before sqlite creates the file.
    db_path.parent.mkdir(parents=True, exist_ok=True)
    connection = sqlite3.connect(str(db_path))
    connection.row_factory = sqlite3.Row
    for pragma in ("PRAGMA journal_mode=WAL", "PRAGMA foreign_keys=ON"):
        connection.execute(pragma)
    return connection
22
+
23
+
24
def init_db(db_path: Path = DB_PATH) -> sqlite3.Connection:
    """Open (or create) the database and apply the bundled schema.

    Safe to call repeatedly: schema.sql uses CREATE ... IF NOT EXISTS.
    Returns the live connection.
    """
    conn = _get_conn(db_path)
    conn.executescript(SCHEMA_PATH.read_text())
    conn.commit()
    return conn
30
+
31
+
32
def insert_document(conn: sqlite3.Connection, doc: Dict[str, Any]) -> str:
    """Insert or replace one document row.

    Required keys: hierarchy_path, title, doc_type, l0_abstract,
    l0_token_count, l2_file_path, l2_checksum. All other fields are
    optional and default sensibly. A doc_id is generated when absent.
    Returns the doc_id that was written.
    """
    doc_id = doc.get("doc_id") or str(uuid.uuid4())
    # Tags live in a TEXT column as a JSON-encoded array.
    encoded_tags = json.dumps(doc.get("tags", []))
    row = (
        doc_id,
        doc["hierarchy_path"],
        doc["title"],
        doc["doc_type"],
        doc["l0_abstract"],
        doc["l0_token_count"],
        doc.get("l1_overview"),
        doc.get("l1_token_count", 0),
        doc["l2_file_path"],
        doc.get("l2_token_count", 0),
        doc["l2_checksum"],
        doc.get("chromadb_l0_id"),
        doc.get("chromadb_l1_id"),
        doc.get("parent_path"),
        doc.get("depth", 0),
        encoded_tags,
        doc.get("l0_generated_at"),
        doc.get("l1_generated_at"),
        doc.get("source_type", "manual"),
        doc.get("cortex_tier"),
    )
    conn.execute(
        """
        INSERT OR REPLACE INTO documents (
            doc_id, hierarchy_path, title, doc_type,
            l0_abstract, l0_token_count,
            l1_overview, l1_token_count,
            l2_file_path, l2_token_count, l2_checksum,
            chromadb_l0_id, chromadb_l1_id,
            parent_path, depth, tags,
            l0_generated_at, l1_generated_at,
            source_type, cortex_tier
        ) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
        """,
        row,
    )
    conn.commit()
    return doc_id
73
+
74
+
75
def get_document(conn: sqlite3.Connection, doc_id: str) -> Optional[Dict[str, Any]]:
    """Fetch a single document by id; None when no such row exists."""
    cursor = conn.execute("SELECT * FROM documents WHERE doc_id = ?", (doc_id,))
    row = cursor.fetchone()
    return _row_to_dict(row) if row is not None else None
80
+
81
+
82
def get_all_documents(conn: sqlite3.Connection) -> List[Dict[str, Any]]:
    """Return every document, most recently updated first."""
    cursor = conn.execute("SELECT * FROM documents ORDER BY updated_at DESC")
    return [_row_to_dict(row) for row in cursor.fetchall()]
85
+
86
+
87
def search_by_hierarchy(
    conn: sqlite3.Connection, prefix: str
) -> List[Dict[str, Any]]:
    """Return documents whose hierarchy_path starts with *prefix*.

    Fix: the prefix is now escaped before being used in LIKE, so literal
    '%', '_' or '\\' characters in a hierarchy path match themselves
    instead of acting as SQL wildcards (the old behavior over-matched).
    """
    # Escape the escape character first, then the two LIKE wildcards.
    escaped = (
        prefix.replace("\\", "\\\\").replace("%", "\\%").replace("_", "\\_")
    )
    rows = conn.execute(
        "SELECT * FROM documents WHERE hierarchy_path LIKE ? ESCAPE '\\' "
        "ORDER BY hierarchy_path",
        (escaped + "%",),
    ).fetchall()
    return [_row_to_dict(r) for r in rows]
95
+
96
+
97
def mark_stale(conn: sqlite3.Connection, doc_id: str, reason: str):
    """Flag a document as stale, recording why (e.g. its L2 file changed)."""
    params = (reason, doc_id)
    conn.execute(
        "UPDATE documents SET is_stale = 1, stale_reason = ? WHERE doc_id = ?",
        params,
    )
    conn.commit()
103
+
104
+
105
def log_query(
    conn: sqlite3.Connection,
    query_text: str,
    l0_results: int,
    l1_expansions: int,
    l2_loads: int,
    total_tokens: int,
    latency_ms: int,
    agent_id: Optional[str] = None,
):
    """Record one retrieval query and its tier-usage stats in query_log.

    A fresh UUID is generated for the query_id; created_at comes from the
    column default in the schema.
    """
    record = (
        str(uuid.uuid4()),
        query_text,
        agent_id,
        l0_results,
        l1_expansions,
        l2_loads,
        total_tokens,
        latency_ms,
    )
    conn.execute(
        """
        INSERT INTO query_log (query_id, query_text, agent_id,
            l0_results, l1_expansions, l2_loads, total_tokens, latency_ms)
        VALUES (?, ?, ?, ?, ?, ?, ?, ?)
        """,
        record,
    )
    conn.commit()
125
+
126
+
127
+ def _row_to_dict(row: sqlite3.Row) -> Dict[str, Any]:
128
+ d = dict(row)
129
+ if isinstance(d.get("tags"), str):
130
+ try:
131
+ d["tags"] = json.loads(d["tags"])
132
+ except (json.JSONDecodeError, TypeError):
133
+ d["tags"] = []
134
+ d["is_stale"] = bool(d.get("is_stale"))
135
+ return d
cortex/schema.sql ADDED
@@ -0,0 +1,75 @@
1
-- Cortex Tiered Retrieval — SQLite schema
-- Equivalent to cortex_tiers PostgreSQL schema from master plan.
-- Stores document metadata + L0/L1 content; L2 lives on filesystem.

CREATE TABLE IF NOT EXISTS documents (
    doc_id TEXT PRIMARY KEY,
    hierarchy_path TEXT NOT NULL,
    title TEXT NOT NULL,
    doc_type TEXT NOT NULL CHECK (doc_type IN (
        'strategy', 'backtest', 'research', 'episode',
        'skill', 'pattern', 'session_learning', 'reference'
    )),

    -- Tier content: L0 is a one-sentence abstract, L1 a structured
    -- overview; full L2 content stays on disk at l2_file_path.
    l0_abstract TEXT NOT NULL,
    l0_token_count INTEGER NOT NULL,
    l1_overview TEXT,
    l1_token_count INTEGER DEFAULT 0,
    l2_file_path TEXT NOT NULL,
    l2_token_count INTEGER DEFAULT 0,
    l2_checksum TEXT NOT NULL,           -- SHA-256 of L2, used for staleness detection

    -- ChromaDB references (vector-index ids for the L0/L1 embeddings)
    chromadb_l0_id TEXT,
    chromadb_l1_id TEXT,

    -- Hierarchy
    parent_path TEXT,
    depth INTEGER DEFAULT 0,
    tags TEXT DEFAULT '[]',              -- JSON-encoded array of strings

    -- Timestamps (ISO-8601 UTC with milliseconds)
    created_at TEXT DEFAULT (strftime('%Y-%m-%dT%H:%M:%fZ', 'now')),
    updated_at TEXT DEFAULT (strftime('%Y-%m-%dT%H:%M:%fZ', 'now')),
    l0_generated_at TEXT,
    l1_generated_at TEXT,

    -- Invalidation: set when L2 changes so tiers can be regenerated
    is_stale INTEGER DEFAULT 0,
    stale_reason TEXT,

    -- Source tracking
    source_type TEXT DEFAULT 'manual',
    cortex_tier TEXT CHECK (cortex_tier IN ('episodic', 'semantic', 'procedural') OR cortex_tier IS NULL)
);

CREATE INDEX IF NOT EXISTS idx_docs_hierarchy ON documents (hierarchy_path);
CREATE INDEX IF NOT EXISTS idx_docs_parent ON documents (parent_path);
CREATE INDEX IF NOT EXISTS idx_docs_type ON documents (doc_type);
-- Partial index: only stale rows, keeps regeneration scans cheap.
CREATE INDEX IF NOT EXISTS idx_docs_stale ON documents (is_stale) WHERE is_stale = 1;

CREATE TABLE IF NOT EXISTS directories (
    dir_id TEXT PRIMARY KEY,
    path TEXT UNIQUE NOT NULL,
    parent_path TEXT,
    name TEXT NOT NULL,
    description TEXT,
    doc_count INTEGER DEFAULT 0,
    created_at TEXT DEFAULT (strftime('%Y-%m-%dT%H:%M:%fZ', 'now')),
    updated_at TEXT DEFAULT (strftime('%Y-%m-%dT%H:%M:%fZ', 'now'))
);

CREATE INDEX IF NOT EXISTS idx_dirs_parent ON directories (parent_path);

-- Per-query telemetry: how many results each tier served and total cost.
CREATE TABLE IF NOT EXISTS query_log (
    query_id TEXT PRIMARY KEY,
    query_text TEXT NOT NULL,
    agent_id TEXT,
    l0_results INTEGER DEFAULT 0,
    l1_expansions INTEGER DEFAULT 0,
    l2_loads INTEGER DEFAULT 0,
    total_tokens INTEGER DEFAULT 0,
    latency_ms INTEGER DEFAULT 0,
    created_at TEXT DEFAULT (strftime('%Y-%m-%dT%H:%M:%fZ', 'now'))
);
@@ -0,0 +1,280 @@
1
"""
TierGenerator — auto-generates L0/L1 tiers from L2 (full) documents.

Uses Ollama (deepseek-r1:7b) for summarization and ChromaDB for vector indexing.
Prompts follow MEMORY_ARCHITECTURE_MASTER_PLAN.md Section 1.4.
"""
import hashlib
import logging
import re
import time
import uuid
from datetime import datetime, timezone
from pathlib import Path
from typing import Optional

import aiohttp
import chromadb

from . import db

logger = logging.getLogger("aoms.cortex")

# Local Ollama endpoint and the model used for tier generation.
OLLAMA_URL = "http://localhost:11434"
GENERATION_MODEL = "deepseek-r1:7b"
# Token budgets for the generated tiers (targets given to the prompts).
L0_MAX_TOKENS = 100
L1_MAX_TOKENS = 2000

# NOTE(review): absolute, machine-specific paths — presumably should be
# configurable (env var / settings); verify before deploying elsewhere.
L2_STORAGE_ROOT = Path("/home/dhawal/cortex-mem/cortex-mem/cortex/l2_docs")
CHROMA_PATH = Path("/home/dhawal/cortex-mem/cortex-mem/index/chroma")

# Prompt template for the one-sentence L0 abstract.
L0_PROMPT = """Summarize in ONE sentence (max 100 tokens): what this document \
is about, its primary conclusion, and one key differentiator.

DOCUMENT TYPE: {doc_type}
HIERARCHY: {hierarchy_path}
TITLE: {title}

CONTENT:
{content}

ABSTRACT:"""

# Prompt template for the structured L1 overview.
L1_PROMPT = """Create a structured overview (under 2000 tokens):

1. PURPOSE: What this is and why it exists (1-2 sentences)
2. KEY POINTS: 3-5 most important facts/findings
3. METRICS: Quantitative results (percentages, performance)
4. RELATIONSHIPS: What this relates to
5. ACTIONABILITY: When/how to use this

Format as clean markdown. Be data-dense.

DOCUMENT TYPE: {doc_type}
HIERARCHY: {hierarchy_path}
TITLE: {title}

CONTENT:
{content}

OVERVIEW:"""
61
+
62
+
63
+ def _estimate_tokens(text: str) -> int:
64
+ """Rough token estimate: ~4 chars per token for English."""
65
+ return len(text) // 4
66
+
67
+
68
+ def _strip_thinking_tags(text: str) -> str:
69
+ """Remove <think>...</think> blocks that deepseek-r1 sometimes emits."""
70
+ return re.sub(r"<think>.*?</think>", "", text, flags=re.DOTALL).strip()
71
+
72
+
73
async def _ollama_generate(prompt: str, max_tokens: int = 2048) -> str:
    """POST *prompt* to Ollama's /api/generate and return the cleaned text.

    Non-streaming, 120 s total timeout, low temperature for stable
    summaries. Raises RuntimeError on any non-200 response.
    """
    request_body = {
        "model": GENERATION_MODEL,
        "prompt": prompt,
        "stream": False,
        "options": {"num_predict": max_tokens, "temperature": 0.3},
    }
    timeout = aiohttp.ClientTimeout(total=120)
    async with aiohttp.ClientSession() as session:
        async with session.post(
            f"{OLLAMA_URL}/api/generate", json=request_body, timeout=timeout
        ) as resp:
            if resp.status != 200:
                body = await resp.text()
                raise RuntimeError(f"Ollama returned {resp.status}: {body}")
            data = await resp.json()
    # deepseek-r1 may wrap reasoning in <think> blocks; strip them out.
    return _strip_thinking_tags(data.get("response", ""))
92
+
93
+
94
def _get_chroma_client() -> chromadb.ClientAPI:
    """Return a persistent ChromaDB client rooted at CHROMA_PATH,
    creating the storage directory if missing."""
    CHROMA_PATH.mkdir(parents=True, exist_ok=True)
    client = chromadb.PersistentClient(path=str(CHROMA_PATH))
    return client
97
+
98
+
99
class TierGenerator:
    """Auto-generates L0 and L1 tiers from L2 content.

    Pipeline per document: write the full text (L2) to disk, summarize it
    via Ollama into a one-sentence abstract (L0) and a structured overview
    (L1), index both in ChromaDB, and persist all metadata in SQLite.
    """

    def __init__(self, db_conn=None):
        # Reuse a caller-supplied SQLite connection, or open/init the default DB.
        self.conn = db_conn or db.init_db()
        # ChromaDB client is created lazily on first access (see `chroma`).
        self._chroma = None

    @property
    def chroma(self):
        """Lazily-created persistent ChromaDB client."""
        if self._chroma is None:
            self._chroma = _get_chroma_client()
        return self._chroma

    @property
    def l0_collection(self):
        """ChromaDB collection of L0 abstracts (cosine distance)."""
        return self.chroma.get_or_create_collection(
            "cortex_l0", metadata={"hnsw:space": "cosine"}
        )

    @property
    def l1_collection(self):
        """ChromaDB collection of L1 overviews (cosine distance)."""
        return self.chroma.get_or_create_collection(
            "cortex_l1", metadata={"hnsw:space": "cosine"}
        )

    async def ingest_document(
        self,
        content: str,
        title: str,
        hierarchy_path: str,
        doc_type: str = "reference",
        tags: Optional[list] = None,
        source_file: Optional[str] = None,
    ) -> str:
        """
        Full pipeline: store L2, generate L0/L1, index in ChromaDB, save metadata.
        Returns doc_id.

        `source_file` only affects the recorded source_type ('file' vs
        'manual'); the content itself always comes from `content`.
        """
        doc_id = str(uuid.uuid4())
        now = datetime.now(timezone.utc).isoformat()
        # Checksum of the raw L2 text; used later for staleness detection.
        l2_checksum = hashlib.sha256(content.encode()).hexdigest()

        # 1. Store L2 on filesystem
        l2_path = self._resolve_l2_path(hierarchy_path, title)
        l2_path.parent.mkdir(parents=True, exist_ok=True)
        l2_path.write_text(content, encoding="utf-8")
        l2_tokens = _estimate_tokens(content)

        logger.info(f"Ingesting '{title}' ({l2_tokens} tokens) → generating L0/L1...")

        # 2. Generate L0 via Ollama
        t0 = time.monotonic()
        l0_abstract = await self._generate_l0(content, title, hierarchy_path, doc_type)
        l0_tokens = _estimate_tokens(l0_abstract)
        logger.info(f" L0 generated: {l0_tokens} tokens ({time.monotonic()-t0:.1f}s)")

        # 3. Generate L1 via Ollama
        t1 = time.monotonic()
        l1_overview = await self._generate_l1(content, title, hierarchy_path, doc_type)
        l1_tokens = _estimate_tokens(l1_overview)
        logger.info(f" L1 generated: {l1_tokens} tokens ({time.monotonic()-t1:.1f}s)")

        # 4. Index in ChromaDB — the same doc_id keys both collections.
        self.l0_collection.upsert(
            ids=[doc_id],
            documents=[l0_abstract],
            metadatas=[{"title": title, "hierarchy_path": hierarchy_path, "doc_type": doc_type}],
        )
        self.l1_collection.upsert(
            ids=[doc_id],
            documents=[l1_overview],
            metadatas=[{"title": title, "hierarchy_path": hierarchy_path, "doc_type": doc_type}],
        )

        # 5. Save to SQLite. Parent path is everything before the last
        # hierarchy segment; root documents get "/".
        parent_path = "/".join(hierarchy_path.rstrip("/").split("/")[:-1]) or "/"
        depth = hierarchy_path.strip("/").count("/")

        db.insert_document(self.conn, {
            "doc_id": doc_id,
            "hierarchy_path": hierarchy_path,
            "title": title,
            "doc_type": doc_type,
            "l0_abstract": l0_abstract,
            "l0_token_count": l0_tokens,
            "l1_overview": l1_overview,
            "l1_token_count": l1_tokens,
            "l2_file_path": str(l2_path),
            "l2_token_count": l2_tokens,
            "l2_checksum": l2_checksum,
            "chromadb_l0_id": doc_id,
            "chromadb_l1_id": doc_id,
            "parent_path": parent_path,
            "depth": depth,
            "tags": tags or [],
            "l0_generated_at": now,
            "l1_generated_at": now,
            "source_type": "file" if source_file else "manual",
        })

        # NOTE(review): t0 was taken before L0 generation, so "total" here
        # covers L0 + L1 + indexing but not the L2 write — confirm intent.
        total_time = time.monotonic() - t0
        logger.info(
            f" Ingested '{title}': L2={l2_tokens}tok → L0={l0_tokens}tok + L1={l1_tokens}tok "
            f"({(1 - (l0_tokens + l1_tokens) / max(l2_tokens, 1)) * 100:.0f}% reduction, {total_time:.1f}s)"
        )
        return doc_id

    async def regenerate(self, doc_id: str) -> bool:
        """Re-generate L0/L1 for an existing document (e.g., after L2 update).

        Returns False when the document row or its L2 file is missing;
        True after tiers, checksum, and indexes are refreshed and the
        stale flag is cleared.
        """
        doc = db.get_document(self.conn, doc_id)
        if doc is None:
            return False

        l2_path = Path(doc["l2_file_path"])
        if not l2_path.exists():
            logger.error(f"L2 file missing for {doc_id}: {l2_path}")
            return False

        content = l2_path.read_text(encoding="utf-8")
        now = datetime.now(timezone.utc).isoformat()

        l0 = await self._generate_l0(content, doc["title"], doc["hierarchy_path"], doc["doc_type"])
        l1 = await self._generate_l1(content, doc["title"], doc["hierarchy_path"], doc["doc_type"])

        self.conn.execute(
            """
            UPDATE documents SET
                l0_abstract = ?, l0_token_count = ?,
                l1_overview = ?, l1_token_count = ?,
                l2_checksum = ?, l2_token_count = ?,
                is_stale = 0, stale_reason = NULL,
                l0_generated_at = ?, l1_generated_at = ?
            WHERE doc_id = ?
            """,
            (
                l0, _estimate_tokens(l0),
                l1, _estimate_tokens(l1),
                hashlib.sha256(content.encode()).hexdigest(),
                _estimate_tokens(content),
                now, now, doc_id,
            ),
        )
        self.conn.commit()

        # NOTE(review): these upserts pass no metadatas, unlike ingest —
        # verify the metadata on the existing embeddings is preserved.
        self.l0_collection.upsert(ids=[doc_id], documents=[l0])
        self.l1_collection.upsert(ids=[doc_id], documents=[l1])

        logger.info(f"Regenerated L0/L1 for '{doc['title']}'")
        return True

    async def _generate_l0(
        self, content: str, title: str, hierarchy_path: str, doc_type: str
    ) -> str:
        """Generate the one-sentence L0 abstract for *content* via Ollama."""
        # Cap prompt size; ~12k chars ≈ 3k tokens of source context.
        truncated = content[:12000]
        prompt = L0_PROMPT.format(
            doc_type=doc_type,
            hierarchy_path=hierarchy_path,
            title=title,
            content=truncated,
        )
        result = await _ollama_generate(prompt, max_tokens=400)
        # Guard against degenerate model output: fall back to title + excerpt.
        if len(result.split()) < 10:
            logger.warning(f"L0 too short ({len(result.split())} words), using title-based fallback")
            first_500 = content[:2000].replace("\n", " ").strip()
            result = f"{title}: {first_500[:300]}"
        return result

    async def _generate_l1(
        self, content: str, title: str, hierarchy_path: str, doc_type: str
    ) -> str:
        """Generate the structured L1 overview for *content* via Ollama."""
        truncated = content[:16000]
        prompt = L1_PROMPT.format(
            doc_type=doc_type,
            hierarchy_path=hierarchy_path,
            title=title,
            content=truncated,
        )
        return await _ollama_generate(prompt, max_tokens=3000)

    def _resolve_l2_path(self, hierarchy_path: str, title: str) -> Path:
        """Map (hierarchy_path, title) to the on-disk markdown path for L2.

        The title is sanitized to filesystem-safe characters and capped at
        80 chars, so distinct titles can collide after sanitization.
        """
        safe_title = re.sub(r"[^\w\-.]", "_", title)[:80]
        return L2_STORAGE_ROOT / hierarchy_path.strip("/") / f"{safe_title}.md"