PyPI - cortext-memory - Versions diffs - 0.1.0__tar.gz - Mend

cortext-memory 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

cortext_memory-0.1.0/LICENSE +21 -0
cortext_memory-0.1.0/PKG-INFO +194 -0
cortext_memory-0.1.0/README.md +162 -0
cortext_memory-0.1.0/cortext/__init__.py +72 -0
cortext_memory-0.1.0/cortext/core/__init__.py +1 -0
cortext_memory-0.1.0/cortext/core/decay/__init__.py +23 -0
cortext_memory-0.1.0/cortext/core/decay/ebbinghaus.py +126 -0
cortext_memory-0.1.0/cortext/core/decay/forget_gate.py +169 -0
cortext_memory-0.1.0/cortext/core/entity.py +85 -0
cortext_memory-0.1.0/cortext/core/graph.py +226 -0
cortext_memory-0.1.0/cortext/core/memory.py +253 -0
cortext_memory-0.1.0/cortext/core/recall/__init__.py +38 -0
cortext_memory-0.1.0/cortext/core/recall/embedding.py +157 -0
cortext_memory-0.1.0/cortext/core/recall/extractor.py +132 -0
cortext_memory-0.1.0/cortext/core/recall/extractors/__init__.py +19 -0
cortext_memory-0.1.0/cortext/core/recall/extractors/regex_lang.py +335 -0
cortext_memory-0.1.0/cortext/core/recall/pack.py +81 -0
cortext_memory-0.1.0/cortext/core/recall/parser.py +194 -0
cortext_memory-0.1.0/cortext/core/recall/text_extractor.py +224 -0
cortext_memory-0.1.0/cortext/core/relation.py +138 -0
cortext_memory-0.1.0/cortext/core/validation/__init__.py +19 -0
cortext_memory-0.1.0/cortext/core/validation/canonical.py +448 -0
cortext_memory-0.1.0/cortext/cortex.py +325 -0
cortext_memory-0.1.0/cortext/integration/__init__.py +5 -0
cortext_memory-0.1.0/cortext/integration/hermes_bridge.py +138 -0
cortext_memory-0.1.0/cortext/workers/__init__.py +5 -0
cortext_memory-0.1.0/cortext/workers/dream_agent.py +293 -0
cortext_memory-0.1.0/cortext_memory.egg-info/PKG-INFO +194 -0
cortext_memory-0.1.0/cortext_memory.egg-info/SOURCES.txt +35 -0
cortext_memory-0.1.0/cortext_memory.egg-info/dependency_links.txt +1 -0
cortext_memory-0.1.0/cortext_memory.egg-info/requires.txt +15 -0
cortext_memory-0.1.0/cortext_memory.egg-info/top_level.txt +1 -0
cortext_memory-0.1.0/pyproject.toml +55 -0
cortext_memory-0.1.0/setup.cfg +4 -0
cortext_memory-0.1.0/tests/test_cortext.py +243 -0
cortext_memory-0.1.0/tests/test_definitive.py +194 -0
cortext_memory-0.1.0/tests/test_hermes_bridge.py +112 -0

cortext_memory-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Jhony Miler
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

cortext_memory-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,194 @@
+Metadata-Version: 2.4
+Name: cortext-memory
+Version: 0.1.0
+Summary: Cognitive memory for AI agents — W5H-structured, contradiction-aware, internationalized, token-efficient
+Author-email: Jhony Miler <jonatasmiler@gmail.com>
+License: MIT
+Project-URL: Homepage, https://github.com/jhonymiler/Cortex
+Project-URL: Repository, https://github.com/jhonymiler/Cortex
+Project-URL: Issues, https://github.com/jhonymiler/Cortex/issues
+Keywords: memory,agents,llm,ai,rag
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Provides-Extra: dev
+Requires-Dist: pytest>=7.0; extra == "dev"
+Requires-Dist: pytest-cov>=4.0; extra == "dev"
+Requires-Dist: ruff>=0.1; extra == "dev"
+Provides-Extra: ollama
+Provides-Extra: openai
+Provides-Extra: embeddings
+Requires-Dist: sentence-transformers>=2.2; extra == "embeddings"
+Provides-Extra: all
+Requires-Dist: sentence-transformers>=2.2; extra == "all"
+Dynamic: license-file
+# Cortex
+*Read this in [Português](README.pt-br.md).*
+> **A cognitive memory system for AI agents — structured, internationalized, contradiction-aware, and token-efficient.**
+Cortex gives an LLM agent a long-term memory that is *structured* rather than a
+flat vector store. Every memory is decomposed into a **W5H** record (who, what,
+why, when, where, how), validated against what is already known so the agent
+does not silently store contradictions, and recalled through a deterministic
+structural parser that returns a **compact** context string instead of a wall
+of raw chunks.
+It is a pure Python library with **zero required dependencies**, local-first,
+and designed to plug into an agent loop as a transparent memory layer (recall
+before the turn, store after it).
+```python
+from cortext import CortexV5
+cortex = CortexV5(namespace="myapp")
+# Store a structured memory (W5H)
+cortex.remember(
+    who=["Maria"],
+    what="reportou erro de pagamento",
+    why="cartão expirado",
+    where="suporte",
+    how="orientada a atualizar dados",
+    lang="pt",
+)
+# Recall — returns (compact_context, RecallResult)
+context, result = cortex.recall("O que Maria pediu?")
+print(context)
+# Maria | reportou erro de pagamento
+```
+## Why structured memory
+Most agent memory is "embed the turn, retrieve top-k chunks." That works until
+it doesn't: chunks are bulky, retrieval mixes unrelated facts, and nothing stops
+the store from holding `X` and `not X` at the same time.
+Cortex takes a different stance — memory is **encoded information**, not mere
+correlation. It is built around five structural properties (discrete schema,
+syntax, an arbitrary-but-stable mapping to external referents, an independent
+interpreter, and functional semantics driven by usage). In practice that buys
+you four concrete things:
+| Property | What it means in practice |
+|---|---|
+| **Structured (W5H)** | Recall returns `Maria \| reportou erro → orientada a atualizar dados`, not a 90-token chunk. |
+| **Normative** | A `CanonicalValidator` detects contradictions *at write time* (3 levels: heuristic → embedding → LLM-as-judge) and can warn or block. |
+| **Internationalized** | The W5H schema is language-neutral; only extraction is language-specific, and it is pluggable (PT/EN/ES regex + optional LLM fallback). |
+| **Self-pruning** | Ebbinghaus decay + a forget gate + an optional background `DreamAgent` that replays, consolidates duplicates, and prunes what is no longer used. |
+## Benchmarks
+Reproducible on this repo (`python bench/run_benchmark.py`), comparing Cortex
+against an unstructured top-k baseline across 2 scenarios:
+| Scenario | Tokens (baseline → Cortex) | Savings | P@5 (baseline → Cortex) | Contradiction detection |
+|---|---|---|---|---|
+| customer_support | 540 → 123 | **77.2%** | 0.367 → 0.778 | 100% |
+| personal_assistant | 380 → 111 | **70.8%** | 0.840 → 0.860 | 67% |
+| **Average** | — | **74.0%** | **0.603 → 0.819** | 83.5% |
+- **~74% fewer context tokens** for the same retrieved information.
+- **Precision@5 up from 0.60 to 0.82** — recall returns the *right* memories.
+- **Zero false positives** in contradiction detection across both scenarios.
+- **~0.1 ms** average recall latency (pure Python, in-memory graph).
+Token savings directly cut prompt cost and free context budget for the actual
+task; higher precision means the agent sees fewer irrelevant memories.
+## Install
+```bash
+pip install cortext-memory
+```
+Optional extras:
+```bash
+pip install "cortext-memory[embeddings]"   # sentence-transformers for embedding-level validation
+pip install "cortext-memory[dev]"          # pytest, ruff
+```
+Cortex runs with **no extra dependencies** by default. The embedding and
+LLM-as-judge contradiction levels are opt-in.
+## How it works
+```
+WRITE   text/W5H ──▶ CanonicalValidator (3-level) ──▶ Memory Graph
+                         (warn or block contradictions)
+RECALL  query ──▶ LangDetector ──▶ HybridExtractor ──▶ QueryIntent (W5H)
+                                                            │
+              Memory Graph ──▶ StructuralQueryParser ──▶ pack_for_context
+                                                            │
+                                                   compact context string
+DECAY   Ebbinghaus retrievability + ForgetGate, with an optional background
+        DreamAgent that replays, consolidates duplicates, and prunes.
+```
+### Internationalization
+The W5H schema is universal; **extraction** is the only language-specific part,
+and it is pluggable:
+```python
+from cortext import RegexExtractor, HybridExtractor, LLMExtractor
+extractor = HybridExtractor(
+    primary=RegexExtractor(default_lang="auto"),   # PT, EN, ES — detected per query
+    fallback=LLMExtractor(model_fn=my_llm_call),   # any language, when regex misses
+)
+```
+Recall is matched within the language of the stored content — store and query in
+the same language for best results, or wire an LLM extractor for arbitrary
+languages.
+## Using it inside an agent
+The intended pattern is a transparent memory layer: recall before the LLM call,
+store after it. `HermesCortexBridge` is a reference implementation of exactly
+this:
+```python
+from cortext.integration import HermesCortexBridge
+bridge = HermesCortexBridge(namespace="session-1")
+# Before the LLM call — inject recalled context:
+context = bridge.pre_chat(user_input)
+system_prompt = context + "\n\n" + base_system_prompt
+# After the turn — persist it:
+bridge.post_chat(user_message=user_input, assistant_message=reply)
+```
+See [docs/INTEGRATION.md](docs/INTEGRATION.md) for plugging Cortex into an agent
+(including the Hermes memory plugin) and [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md)
+for the component-by-component design.
+## Development
+```bash
+python -m venv venv && source venv/bin/activate
+pip install -e ".[dev]"
+pytest                                  # 190+ tests
+python bench/run_benchmark.py        # reproduce the benchmarks
+```
+## License
+MIT — see [LICENSE](LICENSE).

cortext_memory-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,162 @@
+# Cortex
+*Read this in [Português](README.pt-br.md).*
+> **A cognitive memory system for AI agents — structured, internationalized, contradiction-aware, and token-efficient.**
+Cortex gives an LLM agent a long-term memory that is *structured* rather than a
+flat vector store. Every memory is decomposed into a **W5H** record (who, what,
+why, when, where, how), validated against what is already known so the agent
+does not silently store contradictions, and recalled through a deterministic
+structural parser that returns a **compact** context string instead of a wall
+of raw chunks.
+It is a pure Python library with **zero required dependencies**, local-first,
+and designed to plug into an agent loop as a transparent memory layer (recall
+before the turn, store after it).
+```python
+from cortext import CortexV5
+cortex = CortexV5(namespace="myapp")
+# Store a structured memory (W5H)
+cortex.remember(
+    who=["Maria"],
+    what="reportou erro de pagamento",
+    why="cartão expirado",
+    where="suporte",
+    how="orientada a atualizar dados",
+    lang="pt",
+)
+# Recall — returns (compact_context, RecallResult)
+context, result = cortex.recall("O que Maria pediu?")
+print(context)
+# Maria | reportou erro de pagamento
+```
+## Why structured memory
+Most agent memory is "embed the turn, retrieve top-k chunks." That works until
+it doesn't: chunks are bulky, retrieval mixes unrelated facts, and nothing stops
+the store from holding `X` and `not X` at the same time.
+Cortex takes a different stance — memory is **encoded information**, not mere
+correlation. It is built around five structural properties (discrete schema,
+syntax, an arbitrary-but-stable mapping to external referents, an independent
+interpreter, and functional semantics driven by usage). In practice that buys
+you four concrete things:
+| Property | What it means in practice |
+|---|---|
+| **Structured (W5H)** | Recall returns `Maria \| reportou erro → orientada a atualizar dados`, not a 90-token chunk. |
+| **Normative** | A `CanonicalValidator` detects contradictions *at write time* (3 levels: heuristic → embedding → LLM-as-judge) and can warn or block. |
+| **Internationalized** | The W5H schema is language-neutral; only extraction is language-specific, and it is pluggable (PT/EN/ES regex + optional LLM fallback). |
+| **Self-pruning** | Ebbinghaus decay + a forget gate + an optional background `DreamAgent` that replays, consolidates duplicates, and prunes what is no longer used. |
+## Benchmarks
+Reproducible on this repo (`python bench/run_benchmark.py`), comparing Cortex
+against an unstructured top-k baseline across 2 scenarios:
+| Scenario | Tokens (baseline → Cortex) | Savings | P@5 (baseline → Cortex) | Contradiction detection |
+|---|---|---|---|---|
+| customer_support | 540 → 123 | **77.2%** | 0.367 → 0.778 | 100% |
+| personal_assistant | 380 → 111 | **70.8%** | 0.840 → 0.860 | 67% |
+| **Average** | — | **74.0%** | **0.603 → 0.819** | 83.5% |
+- **~74% fewer context tokens** for the same retrieved information.
+- **Precision@5 up from 0.60 to 0.82** — recall returns the *right* memories.
+- **Zero false positives** in contradiction detection across both scenarios.
+- **~0.1 ms** average recall latency (pure Python, in-memory graph).
+Token savings directly cut prompt cost and free context budget for the actual
+task; higher precision means the agent sees fewer irrelevant memories.
+## Install
+```bash
+pip install cortext-memory
+```
+Optional extras:
+```bash
+pip install "cortext-memory[embeddings]"   # sentence-transformers for embedding-level validation
+pip install "cortext-memory[dev]"          # pytest, ruff
+```
+Cortex runs with **no extra dependencies** by default. The embedding and
+LLM-as-judge contradiction levels are opt-in.
+## How it works
+```
+WRITE   text/W5H ──▶ CanonicalValidator (3-level) ──▶ Memory Graph
+                         (warn or block contradictions)
+RECALL  query ──▶ LangDetector ──▶ HybridExtractor ──▶ QueryIntent (W5H)
+                                                            │
+              Memory Graph ──▶ StructuralQueryParser ──▶ pack_for_context
+                                                            │
+                                                   compact context string
+DECAY   Ebbinghaus retrievability + ForgetGate, with an optional background
+        DreamAgent that replays, consolidates duplicates, and prunes.
+```
+### Internationalization
+The W5H schema is universal; **extraction** is the only language-specific part,
+and it is pluggable:
+```python
+from cortext import RegexExtractor, HybridExtractor, LLMExtractor
+extractor = HybridExtractor(
+    primary=RegexExtractor(default_lang="auto"),   # PT, EN, ES — detected per query
+    fallback=LLMExtractor(model_fn=my_llm_call),   # any language, when regex misses
+)
+```
+Recall is matched within the language of the stored content — store and query in
+the same language for best results, or wire an LLM extractor for arbitrary
+languages.
+## Using it inside an agent
+The intended pattern is a transparent memory layer: recall before the LLM call,
+store after it. `HermesCortexBridge` is a reference implementation of exactly
+this:
+```python
+from cortext.integration import HermesCortexBridge
+bridge = HermesCortexBridge(namespace="session-1")
+# Before the LLM call — inject recalled context:
+context = bridge.pre_chat(user_input)
+system_prompt = context + "\n\n" + base_system_prompt
+# After the turn — persist it:
+bridge.post_chat(user_message=user_input, assistant_message=reply)
+```
+See [docs/INTEGRATION.md](docs/INTEGRATION.md) for plugging Cortex into an agent
+(including the Hermes memory plugin) and [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md)
+for the component-by-component design.
+## Development
+```bash
+python -m venv venv && source venv/bin/activate
+pip install -e ".[dev]"
+pytest                                  # 190+ tests
+python bench/run_benchmark.py        # reproduce the benchmarks
+```
+## License
+MIT — see [LICENSE](LICENSE).

cortext_memory-0.1.0/cortext/__init__.py ADDED Viewed

@@ -0,0 +1,72 @@
+"""Cortext — Memory system for AI agents.
+5-element detector compliant, internationalized, efficient.
+"""
+from cortext.cortex import CortexV5
+from cortext.core.memory import Memory
+from cortext.core.entity import Entity
+from cortext.core.relation import Relation, RelationType
+from cortext.core.graph import MemoryGraph, RecallResult
+from cortext.core.validation import (
+    CanonicalValidator,
+    ValidationResult,
+    ValidationStatus,
+    ValidationPolicy,
+    create_default_validator,
+    create_strict_validator,
+)
+from cortext.core.recall import (
+    StructuralQueryParser,
+    QueryIntent,
+    pack_for_context,
+    RegexExtractor,
+    LLMExtractor,
+    HybridExtractor,
+)
+from cortext.core.decay import (
+    DecayConfig,
+    retrievability,
+    effective_stability,
+    decay_status,
+    ForgetGate,
+    ForgetGateConfig,
+)
+from cortext.workers import DreamAgent
+__version__ = "0.1.0"
+__all__ = [
+    # Main entry point
+    "CortexV5",
+    # Core data structures
+    "Memory",
+    "Entity",
+    "Relation",
+    "RelationType",
+    "MemoryGraph",
+    "RecallResult",
+    # Validation
+    "CanonicalValidator",
+    "ValidationResult",
+    "ValidationStatus",
+    "ValidationPolicy",
+    "create_default_validator",
+    "create_strict_validator",
+    # Recall
+    "StructuralQueryParser",
+    "QueryIntent",
+    "pack_for_context",
+    "RegexExtractor",
+    "LLMExtractor",
+    "HybridExtractor",
+    # Decay
+    "DecayConfig",
+    "retrievability",
+    "effective_stability",
+    "decay_status",
+    "ForgetGate",
+    "ForgetGateConfig",
+    # Workers
+    "DreamAgent",
+]

cortext_memory-0.1.0/cortext/core/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+"""Core data structures: Memory, Entity, Relation, MemoryGraph."""

cortext_memory-0.1.0/cortext/core/decay/__init__.py ADDED Viewed

@@ -0,0 +1,23 @@
+"""
+Decay subsystem: Ebbinghaus R = e^(-t/S) + Forget Gate.
+"""
+from cortext.core.decay.ebbinghaus import (
+    DecayConfig,
+    retrievability,
+    effective_stability,
+    decay_status,
+)
+from cortext.core.decay.forget_gate import (
+    ForgetGate,
+    ForgetGateConfig,
+)
+__all__ = [
+    "DecayConfig",
+    "retrievability",
+    "effective_stability",
+    "decay_status",
+    "ForgetGate",
+    "ForgetGateConfig",
+]

cortext_memory-0.1.0/cortext/core/decay/ebbinghaus.py ADDED Viewed

@@ -0,0 +1,126 @@
+"""
+Ebbinghaus decay — R = e^(-t/S).
+The classic forgetting curve, applied to memory retrieval. Simple,
+universal, and validated empirically (Ebbinghaus, 1885).
+Formula: R = e^(-t/S)
+  - R: retrievability (0.0-1.0)
+  - t: time since last access (days)
+  - S: stability (days) — base × modifiers
+Stability modifiers (extensible):
+  - access_count: more accesses = more stable (log scale)
+  - importance: high importance = more stable
+  - consolidation: consolidated memories = more stable
+  - (custom) user-defined via metadata
+"""
+from __future__ import annotations
+import math
+from dataclasses import dataclass
+from datetime import datetime
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from cortext.core.memory import Memory
+@dataclass
+class DecayConfig:
+    """Tunables for the decay function."""
+    # Base stability (days for 63% decay without reinforcement)
+    base_stability_days: float = 7.0
+    # Stability modifiers
+    access_log_multiplier: float = 1.0      # log(access_count + 1) factor
+    importance_bonus: float = 1.3            # bonus for high importance (>0.7)
+    consolidation_bonus: float = 2.0        # bonus for consolidated memories
+    # Min/max stability (prevent degenerate values)
+    min_stability: float = 0.1
+    max_stability: float = 365.0
+    # Thresholds for status
+    active_threshold: float = 0.7
+    fading_threshold: float = 0.3
+    forgotten_threshold: float = 0.1
+def retrievability(
+    memory: "Memory",
+    now: datetime | None = None,
+    config: DecayConfig | None = None,
+) -> float:
+    """
+    Compute retrievability of a memory using the Ebbinghaus curve.
+    R = e^(-t/S), where S = base_stability × modifiers.
+    Returns:
+        float between 0.0 (forgotten) and 1.0 (fresh)
+    """
+    if config is None:
+        config = DecayConfig()
+    now = now or datetime.now()
+    # Reference time = last access, fallback to creation
+    reference_time = memory.last_accessed or memory.when
+    days_since = max(0.0, (now - reference_time).total_seconds() / 86400)
+    # Compute effective stability
+    s = effective_stability(memory, config)
+    # Ebbinghaus formula
+    return math.exp(-days_since / s)
+def effective_stability(
+    memory: "Memory",
+    config: DecayConfig | None = None,
+) -> float:
+    """
+    Compute the effective stability S for a memory.
+    S = base × access_modifier × importance_modifier × consolidation_modifier
+    """
+    if config is None:
+        config = DecayConfig()
+    s = config.base_stability_days
+    # Access count modifier (logarithmic)
+    access_factor = 1.0 + config.access_log_multiplier * math.log(memory.access_count + 1)
+    s *= access_factor
+    # Importance bonus
+    if memory.importance > 0.7:
+        s *= config.importance_bonus
+    # Consolidation bonus
+    if memory.is_consolidated:
+        s *= config.consolidation_bonus
+    return max(config.min_stability, min(config.max_stability, s))
+def decay_status(
+    memory: "Memory",
+    now: datetime | None = None,
+    config: DecayConfig | None = None,
+) -> str:
+    """
+    Get a categorical status: "active" | "fading" | "weak" | "forgotten".
+    """
+    if config is None:
+        config = DecayConfig()
+    r = retrievability(memory, now, config)
+    if r >= config.active_threshold:
+        return "active"
+    elif r >= config.fading_threshold:
+        return "fading"
+    elif r >= config.forgotten_threshold:
+        return "weak"
+    return "forgotten"