PyPI - hb-cortex-memory - Versions diffs - 0.1.0__py3-none-any.whl - Mend

hb-cortex-memory 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

cortex_memory/__init__.py +126 -0
cortex_memory/_textutil.py +83 -0
cortex_memory/assembly.py +335 -0
cortex_memory/db.py +25 -0
cortex_memory/domains.py +158 -0
cortex_memory/dreaming.py +568 -0
cortex_memory/dreaming_prompts.py +55 -0
cortex_memory/dtos.py +260 -0
cortex_memory/embedding.py +58 -0
cortex_memory/enums.py +78 -0
cortex_memory/episodic_tree.py +466 -0
cortex_memory/experience_tree.py +230 -0
cortex_memory/graph.py +409 -0
cortex_memory/ingestion.py +224 -0
cortex_memory/intelligence_tree.py +275 -0
cortex_memory/knowledge_tree.py +483 -0
cortex_memory/models.py +240 -0
cortex_memory/prompts.py +21 -0
cortex_memory/providers.py +156 -0
cortex_memory/providers_reference.py +121 -0
cortex_memory/py.typed +0 -0
cortex_memory/schema.py +43 -0
cortex_memory/scope_policy.py +53 -0
cortex_memory/service.py +1196 -0
hb_cortex_memory-0.1.0.dist-info/METADATA +168 -0
hb_cortex_memory-0.1.0.dist-info/RECORD +29 -0
hb_cortex_memory-0.1.0.dist-info/WHEEL +5 -0
hb_cortex_memory-0.1.0.dist-info/licenses/LICENSE +201 -0
hb_cortex_memory-0.1.0.dist-info/top_level.txt +1 -0

cortex_memory/__init__.py ADDED Viewed

@@ -0,0 +1,126 @@
+"""
+cortex_memory — the CORTEX hierarchical-memory engine, extracted as a
+host-independent package (Phase 12 track `04`).
+Boundary rule (the whole point of the extraction): **this package never
+imports the host** (`src.ai.*`). The host depends on the package and injects
+its concerns — LLM calls, embeddings, usage metering, run lookups — through the
+Protocols in :mod:`cortex_memory.providers`. A host adapter (the thin
+``cortex_bridge`` that stays in ``src/ai/memory``) implements those Protocols.
+Stage-B status: the data layer (own ``Base`` + ORM models + enums + DTOs) and
+the provider boundary live here. The CORTEX services are now part of the
+package too (re-exported below); see ``README.md``.
+"""
+from __future__ import annotations
+from cortex_memory.db import Base, metadata
+from cortex_memory.dtos import (
+    DEFAULT_TRUST_BY_SOURCE,
+    CortexCheckpointCreate,
+    CortexNodeContentResponse,
+    CortexNodeCreate,
+    CortexNodeDetailResponse,
+    CortexNodeSummary,
+    CortexRecurseRequest,
+    CortexTreeCreate,
+    CortexTreeListResponse,
+    CortexTreeResponse,
+    CortexViewportResponse,
+    GoalNode,
+    Provenance,
+    SourceType,
+)
+from cortex_memory.enums import (
+    CortexNodeStatus,
+    CortexNodeType,
+    CortexTreeStatus,
+    MemoryDomain,
+    ScopeLevel,
+)
+from cortex_memory.assembly import MemoryAssemblyResult, MemoryAssemblyService
+from cortex_memory.dreaming import DreamingEngine
+from cortex_memory.episodic_tree import EpisodicTreeService
+from cortex_memory.experience_tree import ExperienceTreeService
+from cortex_memory.graph import SemanticGraphService
+from cortex_memory.intelligence_tree import IntelligenceTreeService
+from cortex_memory.knowledge_tree import KnowledgeTreeService
+from cortex_memory.models import CortexEdge, CortexNode, CortexTree
+from cortex_memory.prompts import CORTEX_OPS_HELP
+from cortex_memory.service import (
+    CheckpointData,
+    CortexService,
+    NodeContent,
+    NodeSummaryDTO,
+    Viewport,
+)
+from cortex_memory.providers import (
+    EmbeddingProvider,
+    EmbeddingResult,
+    LLMProvider,
+    LLMResult,
+    RunfRef,
+    RunRef,
+    RunRegistry,
+    UsageReporter,
+)
+from cortex_memory.scope_policy import ScopePolicy, ScopeViolation
+# Package version string, also exported through ``__all__`` below.
+__version__ = "0.1.0"
+# Public API of the package, grouped by the module each name is re-exported from.
+__all__ = [
+    # data layer (cortex_memory.db, cortex_memory.models, cortex_memory.enums)
+    "Base",
+    "metadata",
+    "CortexTree",
+    "CortexNode",
+    "CortexEdge",
+    "CortexTreeStatus",
+    "CortexNodeType",
+    "CortexNodeStatus",
+    "MemoryDomain",
+    "ScopeLevel",
+    # DTOs (cortex_memory.dtos)
+    "Provenance",
+    "SourceType",
+    "DEFAULT_TRUST_BY_SOURCE",
+    "GoalNode",
+    "CortexTreeCreate",
+    "CortexTreeResponse",
+    "CortexTreeListResponse",
+    "CortexNodeSummary",
+    "CortexViewportResponse",
+    "CortexNodeContentResponse",
+    "CortexNodeCreate",
+    "CortexCheckpointCreate",
+    "CortexRecurseRequest",
+    "CortexNodeDetailResponse",
+    # providers (cortex_memory.providers)
+    "LLMProvider",
+    "LLMResult",
+    "EmbeddingProvider",
+    "EmbeddingResult",
+    "UsageReporter",
+    "RunRegistry",
+    "RunRef",
+    # NOTE(review): "RunfRef" sits right next to "RunRef" — confirm it is a real
+    # name defined in cortex_memory.providers and not a typo.
+    "RunfRef",
+    # services, their result/DTO types, and the CORTEX_OPS_HELP constant
+    # (the latter is imported from cortex_memory.prompts)
+    "CortexService",
+    "SemanticGraphService",
+    "KnowledgeTreeService",
+    "EpisodicTreeService",
+    "ExperienceTreeService",
+    "IntelligenceTreeService",
+    "DreamingEngine",
+    "MemoryAssemblyService",
+    "MemoryAssemblyResult",
+    "Viewport",
+    "NodeSummaryDTO",
+    "NodeContent",
+    "CheckpointData",
+    "CORTEX_OPS_HELP",
+    # scope policy (imported from cortex_memory.scope_policy)
+    "ScopePolicy",
+    "ScopeViolation",
+    "__version__",
+]

cortex_memory/_textutil.py ADDED Viewed

@@ -0,0 +1,83 @@
+"""
+cortex_memory._textutil — small pure text helpers (vendored, host-free).
+These are tiny utility functions the CORTEX services use; vendored into the
+package so it carries no dependency on the host's ``ai.shared`` utilities.
+"""
+from __future__ import annotations
+import json
+import logging
+import re
+from typing import Any, Dict, List, Optional, cast
+logger = logging.getLogger(__name__)
+def truncate_for_storage(data: Any, max_chars: int = 400) -> str:
+    """Render *data* as text and cut it to at most ``max_chars`` characters.
+    ``None`` becomes an empty string and strings are sliced as they are. Any
+    other value is serialised with ``json.dumps`` (members json cannot encode
+    go through ``str``); if serialisation raises, ``str(data)`` is used.
+    """
+    if data is None:
+        return ""
+    if isinstance(data, str):
+        text = data
+    else:
+        try:
+            text = json.dumps(data, default=str)
+        except Exception:
+            # Best-effort fallback: stringify the whole value instead of failing.
+            text = str(data)
+    return text[:max_chars]
+def strip_markdown_fences(text: str) -> str:
+    """Remove ```json ... ``` fences from LLM output.
+    Text that does not start with a fence is returned stripped. For a
+    multi-line fenced block the opening fence line (including any language
+    tag) is dropped, and the last line is dropped too when it is a bare
+    closing fence. A fence written on a single line (```[1, 2]```) keeps its
+    inner text; a language tag glued to it is left in place because it cannot
+    be told apart from content. A lone opening fence line yields ``""``.
+    """
+    text = text.strip()
+    if not text.startswith("```"):
+        return text
+    lines = text.split("\n")
+    if len(lines) == 1:
+        # Inline fence: there is no separate opening line to drop, so peel the
+        # back-ticks off both ends instead of discarding the only line.
+        if len(text) >= 6 and text.endswith("```"):
+            return text[3:-3].strip()
+        return ""
+    end = -1 if lines[-1].strip() == "```" else len(lines)
+    return "\n".join(lines[1:end]).strip()
+def parse_json_array(text: str, warn_label: str = "LLM output") -> List[Dict[str, Any]]:
+    """Parse a JSON array from LLM output (markdown-fence aware). [] on failure.
+    The fence-stripped text is first parsed as a whole. If that does not yield
+    a list, every ``[`` is tried in order as the start of an embedded array and
+    the first one that decodes is returned, so prose or other brackets around
+    the array do not defeat the parse. Elements are returned as decoded; they
+    are not checked to be dicts. ``warn_label`` only appears in the warning
+    logged when nothing could be parsed.
+    """
+    text = strip_markdown_fences(text)
+    try:
+        result = json.loads(text)
+        if isinstance(result, list):
+            return cast(List[Dict[str, Any]], result)
+    except json.JSONDecodeError:
+        pass
+    # Fallback: scan for an embedded array. raw_decode stops at the bracket that
+    # closes the array, so trailing text (even text containing "]") is ignored.
+    decoder = json.JSONDecoder()
+    start = text.find("[")
+    while start != -1:
+        try:
+            candidate, _ = decoder.raw_decode(text[start:])
+        except json.JSONDecodeError:
+            candidate = None
+        if isinstance(candidate, list):
+            return cast(List[Dict[str, Any]], candidate)
+        start = text.find("[", start + 1)
+    logger.warning(f"Failed to parse JSON array from {warn_label}: {text[:200]}")
+    return []
+def parse_json_object(text: str, warn_label: str = "LLM output") -> Optional[Dict[str, Any]]:
+    """Parse a JSON object from LLM output (markdown-fence aware). None on failure.
+    The fence-stripped text is first parsed as a whole. If that does not yield
+    a dict, every ``{`` is tried in order as the start of an embedded object
+    and the first one that decodes is returned, so prose or stray braces
+    around the object do not defeat the parse. ``warn_label`` only appears in
+    the warning logged when nothing could be parsed.
+    """
+    text = strip_markdown_fences(text)
+    try:
+        result = json.loads(text)
+        if isinstance(result, dict):
+            return cast(Dict[str, Any], result)
+    except json.JSONDecodeError:
+        pass
+    # Fallback: scan for an embedded object. raw_decode stops at the brace that
+    # closes the object, so trailing text (even text containing "}") is ignored.
+    decoder = json.JSONDecoder()
+    start = text.find("{")
+    while start != -1:
+        try:
+            candidate, _ = decoder.raw_decode(text[start:])
+        except json.JSONDecodeError:
+            candidate = None
+        if isinstance(candidate, dict):
+            return cast(Dict[str, Any], candidate)
+        start = text.find("{", start + 1)
+    logger.warning(f"Failed to parse JSON object from {warn_label}: {text[:200]}")
+    return None
+# Names exported by this module; all four helpers defined above are public.
+__all__ = [
+    "truncate_for_storage",
+    "strip_markdown_fences",
+    "parse_json_array",
+    "parse_json_object",
+]

cortex_memory/assembly.py ADDED Viewed

@@ -0,0 +1,335 @@
+"""
+cortex_memory.assembly — Unified Memory Assembly Pipeline (Phase F)
+Central orchestrator that replaces MemoryRouter.retrieve() with a
+comprehensive assembly that draws from all four memory domains:
+  - Knowledge (reference nodes from persistent KB trees)
+  - Experience (suggestions from learned patterns)
+  - Intelligence (distilled rules and strategies)
+  - Episodic (recent execution history)
+Usage:
+    assembler = MemoryAssemblyService(db, company_id)
+    result = await assembler.assemble_runtime_memory(
+        entity_id=entity_id,
+        task_description="Analyze Q3 revenue trends",
+    )
+    prompt_text = result.formatted_prompt
+"""
+from __future__ import annotations
+import json
+import logging
+from dataclasses import dataclass, field
+from datetime import datetime, timedelta
+from typing import Any, Dict, List, Optional
+from uuid import UUID
+from sqlalchemy.ext.asyncio import AsyncSession
+logger = logging.getLogger(__name__)
+@dataclass
+class MemoryAssemblyResult:
+    """Container for assembled memory from all four domains.
+    Every list defaults to empty and ``formatted_prompt`` to ``""``, so a
+    freshly constructed instance represents "nothing assembled yet".
+    """
+    # Knowledge-domain search hits, as returned by the semantic graph search.
+    knowledge_refs: List[Dict[str, Any]] = field(default_factory=list)
+    # Experience hits reduced to dicts with "suggestion", "type" and "confidence" keys.
+    experience_suggestions: List[Dict[str, Any]] = field(default_factory=list)
+    # Rules returned by the intelligence tree service for the current task.
+    intelligence_rules: List[Dict[str, Any]] = field(default_factory=list)
+    # Recent plus topic-relevant episodes, de-duplicated and capped at 10 entries.
+    episodic_context: List[Dict[str, Any]] = field(default_factory=list)
+    # Prompt text rendered from the four lists above; "" when all are empty.
+    formatted_prompt: str = ""
+class MemoryAssemblyService:
+    """
+    Unified Memory Assembly Pipeline for v2.
+    Replaces MemoryRouter.retrieve() with a comprehensive assembly
+    that draws from all four memory domains (knowledge, experience,
+    intelligence, episodic).
+    Every domain lookup is best-effort: a failing lookup is logged at debug
+    level and contributes an empty list, so one broken domain does not stop
+    the others from being assembled.
+    """
+    def __init__(
+        self,
+        db: AsyncSession,
+        company_id: UUID,
+        *,
+        embedding: Any = None,
+        llm: Any = None,
+        child_run_factory: Any = None,
+    ):
+        """Store the DB session, the company id and the optional injected providers."""
+        self.db = db
+        self.company_id = company_id
+        # Injected cortex_memory providers, passed down to the graph / domain /
+        # CORTEX services this assembler constructs.
+        self._embedding = embedding
+        self._llm = llm
+        self._child_run_factory = child_run_factory
+    async def assemble_runtime_memory(
+        self,
+        entity_id: UUID,
+        user_id: Optional[UUID] = None,
+        task_description: str = "",
+        runtime_tree: Any = None,
+        include_domains: Optional[List[str]] = None,
+    ) -> MemoryAssemblyResult:
+        """
+        Assemble memory from all four domains for a new execution.
+        ``include_domains`` restricts the work to the named domains
+        ("knowledge", "experience", "intelligence", "episodic"); ``None`` or an
+        empty list selects all four. ``runtime_tree``, when given, receives
+        reference nodes for the top knowledge hits.
+        Returns a MemoryAssemblyResult containing domain-specific data
+        and a pre-formatted prompt string for system prompt injection.
+        """
+        domains = include_domains or ["knowledge", "experience", "intelligence", "episodic"]
+        result = MemoryAssemblyResult()
+        # 1. KNOWLEDGE ASSEMBLY
+        if "knowledge" in domains:
+            result.knowledge_refs = await self._assemble_knowledge(
+                entity_id, task_description, runtime_tree,
+            )
+        # 2. EXPERIENCE RETRIEVAL
+        if "experience" in domains:
+            result.experience_suggestions = await self._retrieve_experience(
+                entity_id, task_description,
+            )
+        # 3. INTELLIGENCE INJECTION
+        if "intelligence" in domains:
+            result.intelligence_rules = await self._retrieve_intelligence(
+                entity_id, task_description,
+            )
+        # 4. EPISODIC CONTEXT
+        if "episodic" in domains:
+            result.episodic_context = await self._retrieve_episodic(
+                entity_id, user_id, task_description,
+            )
+        # 5. Format for prompt
+        result.formatted_prompt = self._format_assembled_memory(result)
+        return result
+    # ===================================================================
+    # Domain Assemblers
+    # ===================================================================
+    async def _assemble_knowledge(
+        self,
+        entity_id: UUID,
+        task_description: str,
+        runtime_tree: Any = None,
+    ) -> List[Dict[str, Any]]:
+        """
+        Find relevant knowledge nodes via semantic graph search.
+        Creates reference nodes in runtime tree if available (top 5 hits only).
+        Returns the search hits, or [] when the search fails or finds nothing.
+        """
+        try:
+            from cortex_memory.graph import SemanticGraphService
+            graph = SemanticGraphService(self.db, self.company_id, embedding=self._embedding)
+            results = await graph.semantic_graph_search(
+                query=task_description,
+                entity_id=entity_id,
+                domains=["knowledge"],
+                top_k=10,
+                graph_expansion_depth=1,
+            )
+            if results and runtime_tree:
+                await self._create_runtime_knowledge_refs(runtime_tree, results[:5])
+            return results or []
+        except Exception as e:
+            logger.debug(f"Knowledge assembly failed: {e}")
+            return []
+    async def _create_runtime_knowledge_refs(self, runtime_tree: Any, results: Any) -> None:
+        """Create reference nodes in the runtime tree's knowledge root.
+        Does nothing when the tree has no knowledge root. Each item is written
+        independently; an item that fails is logged and skipped.
+        """
+        try:
+            from cortex_memory.service import CortexService
+            cortex = CortexService(self.db, self.company_id, llm=self._llm, child_run_factory=self._child_run_factory)
+            knowledge_root = await cortex.get_knowledge_root(runtime_tree.id)
+            if not knowledge_root:
+                return
+            for item in results:
+                try:
+                    # A title that is present but None falls back to the generic
+                    # label instead of raising on the slice and losing the item.
+                    title = item.get("title")
+                    if title is None:
+                        title = "Reference"
+                    await cortex.write(
+                        parent_id=knowledge_root.id,
+                        node_type="knowledge",
+                        title=f"📎 {title[:100]}",
+                        summary=item.get("summary", ""),
+                        content=None,
+                        source_ref={
+                            "ref_type": "cortex_node",
+                            "source_tree_id": item.get("tree_id"),
+                            "source_node_id": item.get("node_id"),
+                            "relevance_score": item.get("combined_score", 0),
+                        },
+                    )
+                except Exception as e:
+                    # One bad reference must not stop the remaining ones.
+                    logger.debug(f"Runtime knowledge reference skipped: {e}")
+        except Exception as e:
+            logger.debug(f"Runtime knowledge reference creation failed: {e}")
+    async def _retrieve_experience(
+        self,
+        entity_id: UUID,
+        task_description: str,
+    ) -> List[Dict[str, Any]]:
+        """Query Experience Tree for suggestions relevant to the current task.
+        Only hits whose node type is "suggestion", "pattern" or "observation"
+        are kept. Returns [] when the search fails.
+        """
+        try:
+            from cortex_memory.graph import SemanticGraphService
+            graph = SemanticGraphService(self.db, self.company_id, embedding=self._embedding)
+            results = await graph.semantic_graph_search(
+                query=task_description,
+                entity_id=entity_id,
+                domains=["experience"],
+                top_k=5,
+            )
+            return [
+                {
+                    "suggestion": r.get("summary", ""),
+                    "type": r.get("node_type"),
+                    "confidence": r.get("combined_score", 0),
+                }
+                for r in (results or [])
+                if r.get("node_type") in ("suggestion", "pattern", "observation")
+            ]
+        except Exception as e:
+            logger.debug(f"Experience retrieval failed: {e}")
+            return []
+    async def _retrieve_intelligence(
+        self,
+        entity_id: UUID,
+        task_description: str,
+    ) -> List[Dict[str, Any]]:
+        """Query Intelligence Tree for applicable rules (at most 10). [] on failure."""
+        try:
+            from cortex_memory.intelligence_tree import IntelligenceTreeService
+            intelligence_svc = IntelligenceTreeService(self.db, self.company_id, embedding=self._embedding)
+            return await intelligence_svc.get_applicable_rules(
+                entity_id=entity_id,
+                task_description=task_description,
+                max_rules=10,
+            )
+        except Exception as e:
+            logger.debug(f"Intelligence retrieval failed: {e}")
+            return []
+    async def _retrieve_episodic(
+        self,
+        entity_id: UUID,
+        user_id: Optional[UUID] = None,
+        task_description: str = "",
+    ) -> List[Dict[str, Any]]:
+        """Retrieve recent and topically relevant episodes.
+        Recent episodes come first, followed by topic matches for
+        ``task_description`` (skipped when it is empty). Duplicates are dropped
+        and at most 10 episodes are returned. ``user_id`` is accepted but not
+        used by this method. Returns [] when retrieval fails.
+        """
+        try:
+            from cortex_memory.episodic_tree import EpisodicTreeService
+            episodic_svc = EpisodicTreeService(self.db, self.company_id, embedding=self._embedding)
+            # Recent episodes
+            recent = await episodic_svc.get_recent_episodes(
+                entity_id=entity_id, limit=5,
+            )
+            # Topic-relevant episodes (semantic)
+            relevant: List[Dict[str, Any]] = []
+            if task_description:
+                try:
+                    relevant_raw = await episodic_svc.query_by_topic(
+                        entity_id=entity_id,
+                        query=task_description,
+                        top_k=3,
+                    )
+                    for ep in relevant_raw:
+                        relevant.append({
+                            "input": ep.get("content", ""),
+                            "output": ep.get("summary", ""),
+                            "status": (ep.get("metadata") or {}).get("status", ""),
+                            "at": ep.get("created_at", ""),
+                        })
+                except Exception as e:
+                    # The topic query is optional; recent episodes are still returned.
+                    logger.debug(f"Episodic topic query failed: {e}")
+            # Merge and deduplicate
+            seen = set()
+            episodes = []
+            for ep in [*(recent or []), *relevant]:
+                # Build the key from text forms so a None or non-string "at" /
+                # "input" cannot raise and wipe out every episode via the
+                # outer except below.
+                key = f"{ep.get('at') or ''}{str(ep.get('input') or '')[:50]}"
+                if key not in seen:
+                    episodes.append(ep)
+                    seen.add(key)
+            return episodes[:10]
+        except Exception as e:
+            logger.debug(f"Episodic retrieval failed: {e}")
+            return []
+    # ===================================================================
+    # Prompt Formatting
+    # ===================================================================
+    def _format_assembled_memory(self, result: MemoryAssemblyResult) -> str:
+        """
+        Format assembled memory into structured prompt text.
+        Layout:
+          [INTELLIGENCE] — Rules and strategies (highest priority)
+          [KNOWLEDGE] — Relevant KB references
+          [EXPERIENCE] — Suggestions from past patterns
+          [EPISODIC] — Recent execution history
+        Empty domains are left out; sections are separated by a blank line.
+        ``None`` scores and texts are treated as their defaults (0.5 for a
+        rule's confidence, 0 for other scores, "" for text) so a single
+        incomplete record cannot abort the whole assembly.
+        """
+        parts = []
+        # Intelligence Rules (highest priority — goes first)
+        if result.intelligence_rules:
+            rule_lines = []
+            for rule in result.intelligence_rules:
+                confidence = rule.get("confidence")
+                if confidence is None:
+                    confidence = 0.5
+                emoji = {
+                    "instruction": "📏",
+                    "strategy": "🎯",
+                    "preference": "❤️",
+                }.get(rule.get("type", ""), "💡")
+                rule_lines.append(
+                    f"  {emoji} [{confidence:.0%}] {rule.get('rule', rule.get('title', ''))}"
+                )
+            parts.append(
+                "## Learned Intelligence\n"
+                "The following rules have been learned from past experience:\n"
+                + "\n".join(rule_lines)
+            )
+        # Knowledge References
+        if result.knowledge_refs:
+            kb_lines = [
+                f"  📎 [{(r.get('combined_score') or 0):.2f}] "
+                f"{r.get('title', 'Untitled')}: {(r.get('summary') or '')[:200]}"
+                for r in result.knowledge_refs[:5]
+            ]
+            parts.append("## Relevant Knowledge\n" + "\n".join(kb_lines))
+        # Experience Suggestions
+        if result.experience_suggestions:
+            exp_lines = [
+                f"  💡 [{(s.get('confidence') or 0):.2f}] {(s.get('suggestion') or '')[:200]}"
+                for s in result.experience_suggestions
+            ]
+            parts.append("## Experience Suggestions\n" + "\n".join(exp_lines))
+        # Episodic Context
+        if result.episodic_context:
+            ep_lines = []
+            for ep in result.episodic_context[:5]:
+                inp = (ep.get("input") or "")[:150]
+                out = (ep.get("output") or "")[:150]
+                at = ep.get("at", "")
+                ep_lines.append(f"  [{at}] {inp!r} → {out!r}")
+            parts.append("## Recent Execution History\n" + "\n".join(ep_lines))
+        return "\n\n".join(parts)

cortex_memory/db.py ADDED Viewed

@@ -0,0 +1,25 @@
+"""
+cortex_memory.db — the package's own SQLAlchemy declarative base.
+The package owns its ``Base`` (plan `04` decision K4) so it can ship its own
+schema + Alembic migrations and be installed standalone. The host shares this
+metadata during the in-host phase (its Alembic ``target_metadata`` is a list
+including ``cortex_memory.db.metadata``) so host autogenerate never drops the
+CORTEX tables.
+External references (company/user/entity/run) are **opaque nullable UUIDs**
+(decision K5): no ``ForeignKey`` to host tables, so the package's schema stands
+alone. The host enforces referential integrity in its own schema.
+"""
+from __future__ import annotations
+from sqlalchemy.orm import DeclarativeBase
+class Base(DeclarativeBase):
+    """The package's declarative base (SQLAlchemy 2.0, typed).
+    Owned by this package rather than shared with a host base, so the
+    package's tables are collected in their own metadata.
+    """
+# Module-level alias for the metadata attached to ``Base``, so callers can
+# import it directly from this module.
+metadata = Base.metadata
+__all__ = ["Base", "metadata"]