PyPI - memex-python - Versions diffs - 0.13.0__py3-none-any.whl - Mend

memex-python 0.13.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

memex/__init__.py +336 -0
memex/_time.py +26 -0
memex/_uuid.py +62 -0
memex/bulk.py +138 -0
memex/commands.py +75 -0
memex/envelope.py +69 -0
memex/errors.py +51 -0
memex/factories.py +97 -0
memex/graph.py +30 -0
memex/integrity.py +317 -0
memex/intent.py +318 -0
memex/models.py +271 -0
memex/query.py +435 -0
memex/reducer.py +151 -0
memex/replay.py +144 -0
memex/retrieval.py +266 -0
memex/schemas.py +67 -0
memex/serialization.py +47 -0
memex/stats.py +71 -0
memex/store.py +222 -0
memex/task.py +361 -0
memex/transplant.py +480 -0
memex_python-0.13.0.dist-info/METADATA +150 -0
memex_python-0.13.0.dist-info/RECORD +26 -0
memex_python-0.13.0.dist-info/WHEEL +4 -0
memex_python-0.13.0.dist-info/licenses/LICENSE +190 -0

memex/query.py ADDED Viewed

@@ -0,0 +1,435 @@
+"""Filtering, scoring, decay, sorting, and neighborhood navigation.
+Iteration order follows insertion order everywhere (Python ``dict`` preserves it,
+matching JS ``Map``), so result ordering is identical to the TS library. The
+multi-sort comparator is ported via ``functools.cmp_to_key`` to reproduce the JS
+comparator exactly, including its stable tie-breaking.
+"""
+from __future__ import annotations
+import math
+from functools import cmp_to_key
+from typing import Any
+from pydantic import BaseModel
+from . import _time
+from ._uuid import safe_extract_timestamp
+from .errors import InvalidTimestampError
+from .graph import GraphState
+from .models import (
+    DecayConfig,
+    Edge,
+    EdgeFilter,
+    MemoryFilter,
+    MemoryItem,
+    QueryOptions,
+    Range,
+    ScoredItem,
+    ScoreWeights,
+    SortOption,
+)
+# Names exported by ``from memex.query import *``.
+__all__ = [
+    "ScoredQueryOptions",
+    "matches_filter",
+    "extract_timestamp",
+    "get_items",
+    "get_scored_items",
+    "get_edges",
+    "get_item_by_id",
+    "get_edge_by_id",
+    "get_related_items",
+    "get_parents",
+    "get_children",
+    "compute_decay_multiplier",
+    "compute_score",
+    "get_sort_value",
+]
+# Sentinel returned by _resolve_path when a path segment is absent, so that a
+# stored ``None`` can be told apart from "no such key".
+_MISSING = object()
+# Length in milliseconds of each decay interval name accepted by
+# compute_decay_multiplier.
+INTERVAL_MS: dict[str, int] = {
+    "hour": 3_600_000,
+    "day": 86_400_000,
+    "week": 604_800_000,
+}
+# ---------------------------------------------------------------------------
+# Coercion helpers — public functions accept models OR plain dicts (D5/ergonomics)
+# ---------------------------------------------------------------------------
+def _coerce_filter(f: MemoryFilter | dict[str, Any] | None) -> MemoryFilter | None:
+    """Return ``f`` as a ``MemoryFilter``; ``None`` and ready-made filters pass through."""
+    needs_validation = f is not None and not isinstance(f, MemoryFilter)
+    return MemoryFilter.model_validate(f) if needs_validation else f
+def _coerce_options(o: QueryOptions | dict[str, Any] | None) -> QueryOptions | None:
+    """Return ``o`` as ``QueryOptions``; anything else that is not ``None`` is validated."""
+    already_usable = o is None or isinstance(o, QueryOptions)
+    return o if already_usable else QueryOptions.model_validate(o)
+def _coerce_weights(w: ScoreWeights | dict[str, Any]) -> ScoreWeights:
+    """Return ``w`` unchanged when it is ``ScoreWeights``, otherwise validate it into one."""
+    return w if isinstance(w, ScoreWeights) else ScoreWeights.model_validate(w)
+def _coerce_edge_filter(f: EdgeFilter | dict[str, Any] | None) -> EdgeFilter | None:
+    """Return ``f`` as an ``EdgeFilter``; ``None`` and ready-made filters pass through."""
+    if f is not None and not isinstance(f, EdgeFilter):
+        return EdgeFilter.model_validate(f)
+    return f
+# ---------------------------------------------------------------------------
+# Timestamp helpers
+# ---------------------------------------------------------------------------
+def extract_timestamp(uuid_id: str) -> int:
+    """Return the millisecond timestamp embedded in a UUIDv7 id.
+    Raises ``InvalidTimestampError`` when ``safe_extract_timestamp`` yields ``None``.
+    """
+    millis = safe_extract_timestamp(uuid_id)
+    if millis is not None:
+        return millis
+    raise InvalidTimestampError(
+        f'Cannot extract timestamp: "{uuid_id}" is not a valid UUIDv7'
+    )
+def _item_timestamp(item: MemoryItem) -> int:
+    """Return the item's timestamp: ``created_at`` when set, else the one derived from its id.
+    Raises ``InvalidTimestampError`` when neither source yields a value.
+    """
+    stamp = item.created_at
+    if stamp is None:
+        # No explicit creation time: fall back to the timestamp carried by the id.
+        stamp = safe_extract_timestamp(item.id)
+    if stamp is None:
+        raise InvalidTimestampError(
+            f'Cannot determine timestamp for item "{item.id}": '
+            "set created_at or use a UUIDv7 id"
+        )
+    return stamp
+# ---------------------------------------------------------------------------
+# Filtering
+# ---------------------------------------------------------------------------
+def _resolve_path(obj: Any, path: str) -> Any:
+    """Walk nested dicts along a dot-separated ``path``.
+    Returns the value reached, or ``_MISSING`` as soon as a step lands on a
+    non-dict or on a key that is absent.
+    """
+    node = obj
+    for key in path.split("."):
+        if isinstance(node, dict) and key in node:
+            node = node[key]
+        else:
+            return _MISSING
+    return node
+def _matches_range(value: float | None, rng: Range | None) -> bool:
+    """Return True when ``value`` lies within ``rng`` (both bounds inclusive).
+    A ``None`` range accepts everything. A ``None`` value is accepted only when
+    the range sets neither ``min`` nor ``max``.
+    """
+    if rng is None:
+        return True
+    lower = rng.min
+    if lower is not None:
+        if value is None or value < lower:
+            return False
+    upper = rng.max
+    if upper is None:
+        return True
+    return not (value is None or value > upper)
+def matches_filter(item: MemoryItem, f: MemoryFilter) -> bool:
+    """Return True when ``item`` satisfies every constraint that is set on ``f``.
+    Constraints left as ``None`` are skipped (``or_`` is also skipped when empty).
+    Checks run in the order written and stop at the first failure. The ``decay``
+    and ``created`` checks need the item's timestamp, so ``InvalidTimestampError``
+    can propagate from them, as can ``ValueError`` from ``compute_decay_multiplier``.
+    """
+    # --- exact-match and membership constraints on scalar fields ---
+    if f.ids is not None and item.id not in f.ids:
+        return False
+    if f.scope is not None and item.scope != f.scope:
+        return False
+    if f.scope_prefix is not None and not item.scope.startswith(f.scope_prefix):
+        return False
+    if f.author is not None and item.author != f.author:
+        return False
+    if f.kind is not None and item.kind != f.kind:
+        return False
+    if f.source_kind is not None and item.source_kind != f.source_kind:
+        return False
+    if f.intent_id is not None and item.intent_id != f.intent_id:
+        return False
+    # An item without an intent_id never satisfies an intent_ids constraint.
+    if f.intent_ids is not None and (
+        item.intent_id is None or item.intent_id not in f.intent_ids
+    ):
+        return False
+    if f.task_id is not None and item.task_id != f.task_id:
+        return False
+    # Same rule as intent_ids: a missing task_id fails the membership test.
+    if f.task_ids is not None and (
+        item.task_id is None or item.task_id not in f.task_ids
+    ):
+        return False
+    # --- numeric ranges on the three score fields ---
+    if f.range is not None:
+        if not _matches_range(item.authority, f.range.authority):
+            return False
+        if not _matches_range(item.conviction, f.range.conviction):
+            return False
+        if not _matches_range(item.importance, f.range.importance):
+            return False
+    # --- parent relationships ---
+    if f.has_parent is not None:
+        if item.parents is None or f.has_parent not in item.parents:
+            return False
+    if f.is_root is not None:
+        # An item counts as a root when ``parents`` is None or empty.
+        has_parents = item.parents is not None and len(item.parents) > 0
+        if f.is_root and has_parents:
+            return False
+        if not f.is_root and not has_parents:
+            return False
+    if f.parents is not None:
+        # Missing parents are treated as an empty list for all sub-checks.
+        p = item.parents or []
+        if f.parents.includes is not None and f.parents.includes not in p:
+            return False
+        if f.parents.includes_any is not None and not any(i in p for i in f.parents.includes_any):
+            return False
+        if f.parents.includes_all is not None and not all(i in p for i in f.parents.includes_all):
+            return False
+        if f.parents.count is not None and not _matches_range(len(p), f.parents.count):
+            return False
+    # --- time-based constraints ---
+    if f.decay is not None:
+        # Reject items whose current decay multiplier has dropped below the floor.
+        multiplier = compute_decay_multiplier(item, f.decay.config)
+        if multiplier < f.decay.min:
+            return False
+    if f.created is not None:
+        ts = _item_timestamp(item)
+        # ``before`` is exclusive, ``after`` is inclusive.
+        if f.created.before is not None and ts >= f.created.before:
+            return False
+        if f.created.after is not None and ts < f.created.after:
+            return False
+    # --- boolean composition and metadata ---
+    # Negation: reject when the nested filter matches.
+    if f.not_ is not None and matches_filter(item, f.not_):
+        return False
+    if f.meta is not None:
+        # Each dotted path must resolve to exactly ``value``; an unresolved path
+        # yields the _MISSING sentinel, which fails the comparison for ordinary values.
+        for path, value in f.meta.items():
+            if _resolve_path(item.meta, path) != value:
+                return False
+    if f.meta_has is not None:
+        # Presence check only: the value at the path may be anything, including None.
+        for path in f.meta_has:
+            if _resolve_path(item.meta, path) is _MISSING:
+                return False
+    if f.or_:
+        # At least one alternative must match, in addition to everything above.
+        if not any(matches_filter(item, sub) for sub in f.or_):
+            return False
+    return True
+# ---------------------------------------------------------------------------
+# Decay & scoring
+# ---------------------------------------------------------------------------
+def compute_decay_multiplier(item: MemoryItem, decay: DecayConfig) -> float:
+    """Return the decay multiplier for ``item`` at the current ``_time.now_ms()``.
+    Age is measured in units of ``decay.interval``. ``"exponential"`` yields
+    ``(1 - rate) ** age``, ``"step"`` the same with the age floored to whole
+    intervals, and ``"linear"`` yields ``1 - rate * age`` clamped at 0. An item
+    whose timestamp is not in the past gets 1.0 before the config is inspected.
+    Raises ``ValueError`` for an unknown interval or decay type.
+    NOTE(review): if ``rate`` could exceed 1 the base goes negative, and ``**``
+    with a fractional exponent then produces a complex number that ``float()``
+    rejects - confirm that ``DecayConfig`` bounds ``rate``.
+    """
+    elapsed_ms = _time.now_ms() - _item_timestamp(item)
+    if elapsed_ms <= 0:
+        # Timestamp at or ahead of the clock (e.g. clock skew): no decay.
+        return 1.0
+    unit_ms = INTERVAL_MS.get(decay.interval)
+    if unit_ms is None:
+        raise ValueError(
+            f'Unknown decay interval: "{decay.interval}". Expected "hour", "day", or "week".'
+        )
+    elapsed_units = elapsed_ms / unit_ms
+    match decay.type:
+        case "exponential":
+            return float((1 - decay.rate) ** elapsed_units)
+        case "linear":
+            return max(0.0, 1 - decay.rate * elapsed_units)
+        case "step":
+            return float((1 - decay.rate) ** math.floor(elapsed_units))
+        case _:
+            raise ValueError(
+                f'Unknown decay type: "{decay.type}". Expected "exponential", "linear", or "step".'
+            )
+def _n(value: float | None) -> float:
+    """Return ``value``, substituting 0.0 for ``None``."""
+    if value is None:
+        return 0.0
+    return value
+def compute_score(item: MemoryItem, weights: ScoreWeights) -> float:
+    """Return the weighted sum of the item's authority, conviction and importance.
+    Unset weights and unset conviction/importance count as 0. When
+    ``weights.decay`` is set, the sum is scaled by ``compute_decay_multiplier``.
+    """
+    authority_term = _n(weights.authority) * item.authority
+    conviction_term = _n(weights.conviction) * _n(item.conviction)
+    importance_term = _n(weights.importance) * _n(item.importance)
+    total = authority_term + conviction_term + importance_term
+    decay = weights.decay
+    if decay is not None:
+        return total * compute_decay_multiplier(item, decay)
+    return total
+# ---------------------------------------------------------------------------
+# Sorting
+# ---------------------------------------------------------------------------
+def get_sort_value(item: MemoryItem, field: str) -> float:
+    """Return the number an item is ordered by for the given sort ``field``.
+    ``"conviction"`` and ``"importance"`` fall back to 0.0 when unset;
+    ``"recency"`` uses the item's timestamp. Raises ``ValueError`` for any
+    other field name.
+    """
+    match field:
+        case "authority":
+            return item.authority
+        case "conviction":
+            return _n(item.conviction)
+        case "importance":
+            return _n(item.importance)
+        case "recency":
+            return _item_timestamp(item)
+        case _:
+            raise ValueError(
+                f'Unknown sort field: "{field}". '
+                'Expected "authority", "conviction", "importance", or "recency".'
+            )
+def _multi_sort(items: list[MemoryItem], sorts: list[SortOption]) -> list[MemoryItem]:
+    """Return a new list ordered by each sort option in turn.
+    Later options only break ties left by earlier ones; items that tie on every
+    option keep their input order because the underlying sort is stable.
+    """
+    def _compare(left: MemoryItem, right: MemoryItem) -> int:
+        for spec in sorts:
+            left_value = get_sort_value(left, spec.field)
+            right_value = get_sort_value(right, spec.field)
+            if left_value < right_value:
+                direction = -1
+            elif left_value > right_value:
+                direction = 1
+            else:
+                # Tie on this key: let the next sort option decide.
+                continue
+            return direction if spec.order == "asc" else -direction
+        return 0
+    ordered = list(items)
+    ordered.sort(key=cmp_to_key(_compare))
+    return ordered
+# ---------------------------------------------------------------------------
+# Queries
+# ---------------------------------------------------------------------------
+def get_items(
+    state: GraphState,
+    filter: MemoryFilter | dict[str, Any] | None = None,
+    options: QueryOptions | dict[str, Any] | None = None,
+) -> list[MemoryItem]:
+    """Return the items of ``state`` that match ``filter``, in insertion order.
+    ``options`` may then sort the matches (one sort option or a list of them)
+    and cut a window with ``offset`` / ``limit``. Both arguments accept either
+    the model or a plain dict.
+    """
+    criteria = _coerce_filter(filter)
+    candidates = state.items.values()
+    if criteria is None:
+        selected = list(candidates)
+    else:
+        selected = [entry for entry in candidates if matches_filter(entry, criteria)]
+    opts = _coerce_options(options)
+    if opts is None:
+        return selected
+    if opts.sort is not None:
+        sort_specs = opts.sort if isinstance(opts.sort, list) else [opts.sort]
+        selected = _multi_sort(selected, sort_specs)
+    if opts.offset is None and opts.limit is None:
+        return selected
+    first = opts.offset or 0
+    stop = None if opts.limit is None else first + opts.limit
+    return selected[first:stop]
+# Options accepted by get_scored_items.
+class ScoredQueryOptions(BaseModel):
+    # Filter applied while selecting items, before any score is computed.
+    pre: MemoryFilter | None = None
+    # Filter applied to the scored items, after the min_score cut.
+    post: MemoryFilter | None = None
+    # Keep only results whose score is >= this value.
+    min_score: float | None = None
+    # Maximum number of results returned, counted from ``offset``.
+    limit: int | None = None
+    # Number of leading results to skip (treated as 0 when unset).
+    offset: int | None = None
+def _coerce_scored_options(
+    o: ScoredQueryOptions | dict[str, Any] | None,
+) -> ScoredQueryOptions | None:
+    """Return ``o`` as ``ScoredQueryOptions``; ``None`` and ready-made options pass through."""
+    needs_validation = o is not None and not isinstance(o, ScoredQueryOptions)
+    return ScoredQueryOptions.model_validate(o) if needs_validation else o
+def get_scored_items(
+    state: GraphState,
+    weights: ScoreWeights | dict[str, Any],
+    options: ScoredQueryOptions | dict[str, Any] | None = None,
+) -> list[ScoredItem]:
+    """Score the items of ``state`` and return them ordered by descending score.
+    Pipeline: select with ``options.pre``, score with ``weights``, sort, drop
+    scores below ``options.min_score``, apply ``options.post``, then cut the
+    ``offset`` / ``limit`` window. Items with equal scores keep selection order.
+    """
+    score_weights = _coerce_weights(weights)
+    opts = _coerce_scored_options(options)
+    pre_filter = opts.pre if opts else None
+    ranked = sorted(
+        (
+            ScoredItem(item=entry, score=compute_score(entry, score_weights))
+            for entry in get_items(state, pre_filter)
+        ),
+        key=lambda candidate: candidate.score,
+        reverse=True,
+    )
+    if opts is None:
+        return ranked
+    if opts.min_score is not None:
+        ranked = [candidate for candidate in ranked if candidate.score >= opts.min_score]
+    if opts.post is not None:
+        ranked = [candidate for candidate in ranked if matches_filter(candidate.item, opts.post)]
+    if opts.offset is not None or opts.limit is not None:
+        first = opts.offset or 0
+        stop = None if opts.limit is None else first + opts.limit
+        ranked = ranked[first:stop]
+    return ranked
+def get_edges(
+    state: GraphState,
+    filter: EdgeFilter | dict[str, Any] | None = None,
+) -> list[Edge]:
+    """Return the edges of ``state`` that match ``filter``, in insertion order.
+    Inactive edges are excluded unless the filter sets ``active_only`` to a
+    falsy value. An edge without a weight never satisfies ``min_weight``.
+    """
+    criteria = _coerce_edge_filter(filter)
+    if criteria is None or criteria.active_only is None:
+        active_only = True
+    else:
+        active_only = criteria.active_only
+    def _accepts(edge: Edge) -> bool:
+        if active_only and not edge.active:
+            return False
+        if criteria is None:
+            return True
+        if criteria.from_ is not None and edge.from_ != criteria.from_:
+            return False
+        if criteria.to is not None and edge.to != criteria.to:
+            return False
+        if criteria.kind is not None and edge.kind != criteria.kind:
+            return False
+        if criteria.min_weight is not None and (
+            edge.weight is None or edge.weight < criteria.min_weight
+        ):
+            return False
+        return True
+    return [edge for edge in state.edges.values() if _accepts(edge)]
+def get_item_by_id(state: GraphState, id: str) -> MemoryItem | None:
+    """Look up an item by id; ``None`` when the id is not in ``state.items``."""
+    known_items = state.items
+    return known_items.get(id)
+def get_edge_by_id(state: GraphState, edge_id: str) -> Edge | None:
+    """Look up an edge by id; ``None`` when the id is not in ``state.edges``."""
+    known_edges = state.edges
+    return known_edges.get(edge_id)
+def get_related_items(
+    state: GraphState,
+    item_id: str,
+    direction: str = "both",
+) -> list[MemoryItem]:
+    """Return the items joined to ``item_id`` by an active edge.
+    ``direction`` selects which edges count: ``"from"`` follows edges leaving
+    ``item_id``, ``"to"`` follows edges arriving at it, ``"both"`` follows either.
+    Each neighbour appears once, in the order first encountered; the item itself
+    and ids missing from ``state.items`` are left out.
+    """
+    follow_outgoing = direction in ("from", "both")
+    follow_incoming = direction in ("to", "both")
+    neighbours: dict[str, None] = {}  # dict keys act as an insertion-ordered set
+    for edge in state.edges.values():
+        if edge.active:
+            if follow_outgoing and edge.from_ == item_id:
+                neighbours.setdefault(edge.to)
+            if follow_incoming and edge.to == item_id:
+                neighbours.setdefault(edge.from_)
+    # A self-loop would list the item as its own neighbour; drop it.
+    neighbours.pop(item_id, None)
+    looked_up = (state.items.get(neighbour_id) for neighbour_id in neighbours)
+    return [found for found in looked_up if found is not None]
+def get_parents(state: GraphState, item_id: str) -> list[MemoryItem]:
+    """Return the parent items of ``item_id``, in the order its ``parents`` lists them.
+    Unknown items, items without parents, and parent ids that are not in
+    ``state.items`` contribute nothing.
+    """
+    child = state.items.get(item_id)
+    parent_ids = child.parents if child is not None else None
+    if not parent_ids:
+        return []
+    lookup = state.items
+    resolved: list[MemoryItem] = []
+    for parent_id in parent_ids:
+        if parent_id in lookup:
+            resolved.append(lookup[parent_id])
+    return resolved
+def get_children(state: GraphState, item_id: str) -> list[MemoryItem]:
+    """Return every item that lists ``item_id`` among its parents, in insertion order."""
+    children: list[MemoryItem] = []
+    for candidate in state.items.values():
+        parent_ids = candidate.parents
+        if parent_ids and item_id in parent_ids:
+            children.append(candidate)
+    return children

memex/reducer.py ADDED Viewed

@@ -0,0 +1,151 @@
+"""The memory-graph reducer: ``apply_command(state, cmd) -> (new_state, events)``.
+Pure and immutable — every branch returns a fresh :class:`GraphState` (the
+relevant dict is cloned) and never mutates the input. ``merge_item`` /
+``merge_edge`` use ``model_copy(update=...)``, which does NOT re-validate — this
+exactly mirrors the TS guarantee that *factories validate scores, updates do not*.
+"""
+from __future__ import annotations
+from typing import Any, NamedTuple
+from pydantic import BaseModel
+from .commands import (
+    EdgeCreate,
+    EdgeRetract,
+    EdgeUpdate,
+    MemoryCommand,
+    MemoryCommandAdapter,
+    MemoryCreate,
+    MemoryRetract,
+    MemoryUpdate,
+)
+from .errors import (
+    DuplicateEdgeError,
+    DuplicateMemoryError,
+    EdgeNotFoundError,
+    MemoryNotFoundError,
+)
+from .graph import GraphState
+from .models import Edge, MemoryItem, MemoryLifecycleEvent
+# Names exported by ``from memex.reducer import *``.
+__all__ = ["CommandResult", "apply_command", "merge_item", "merge_edge"]
+# Return value of apply_command: the resulting graph state plus the lifecycle
+# events the command produced, in emission order.
+class CommandResult(NamedTuple):
+    state: GraphState
+    events: list[MemoryLifecycleEvent]
+# Partial keys that merge_edge discards, so an update cannot change an edge's
+# id or endpoints. Both "from" and "from_" are listed.
+_EDGE_IMMUTABLE = frozenset({"edge_id", "from", "from_", "to"})
+def _merge_and_prune(base: dict[str, Any], patch: dict[str, Any]) -> dict[str, Any]:
+    """Return a new dict holding ``base`` overlaid with ``patch`` (shallow).
+    The TS original drops ``undefined`` entries around the merge. Python has no
+    ``undefined`` and keeps ``None`` (the counterpart of JS ``null``), so nothing
+    is pruned here: an update can overwrite content/meta keys but cannot delete
+    them, matching the TS behavior.
+    """
+    merged = {**base}
+    merged.update(patch)
+    return merged
+def merge_item(existing: MemoryItem, partial: dict[str, Any]) -> MemoryItem:
+    """Return a copy of ``existing`` with ``partial`` applied.
+    ``id`` and ``created_at`` in the partial are ignored. ``content`` and
+    ``meta`` are shallow-merged onto the current values; every other key
+    replaces the field outright. The copy is made with ``model_copy``.
+    """
+    changes: dict[str, Any] = {}
+    for field_name, new_value in partial.items():
+        match field_name:
+            case "id" | "created_at":
+                continue
+            case "content":
+                changes["content"] = _merge_and_prune(existing.content, new_value)
+            case "meta":
+                changes["meta"] = _merge_and_prune(existing.meta or {}, new_value)
+            case _:
+                changes[field_name] = new_value
+    return existing.model_copy(update=changes)
+def merge_edge(existing: Edge, partial: dict[str, Any]) -> Edge:
+    """Return a copy of ``existing`` with ``partial`` applied.
+    Keys listed in ``_EDGE_IMMUTABLE`` (the edge id and its endpoints) are dropped
+    from the partial first, so they keep their current values.
+    """
+    allowed: dict[str, Any] = {}
+    for name, value in partial.items():
+        if name not in _EDGE_IMMUTABLE:
+            allowed[name] = value
+    return existing.model_copy(update=allowed)
+def apply_command(state: GraphState, cmd: MemoryCommand | dict[str, Any]) -> CommandResult:
+    """Apply one command to ``state`` and return the new state with its events.
+    ``cmd`` may be a command model or a plain dict; dicts are validated through
+    ``MemoryCommandAdapter``. The input ``state`` is not modified: each branch
+    builds a new dict for whichever of items/edges it changes and reuses the
+    other one as-is.
+    Raises ``DuplicateMemoryError`` / ``DuplicateEdgeError`` when creating an id
+    that already exists, ``MemoryNotFoundError`` / ``EdgeNotFoundError`` when
+    updating or retracting an unknown id, and ``TypeError`` for a model that is
+    not one of the known command types.
+    """
+    command = cmd if isinstance(cmd, BaseModel) else MemoryCommandAdapter.validate_python(cmd)
+    match command:
+        case MemoryCreate(item=item):
+            if item.id in state.items:
+                raise DuplicateMemoryError(item.id)
+            # New dict with the item appended; existing entries keep their order.
+            items = {**state.items, item.id: item}
+            return CommandResult(
+                GraphState(items, state.edges),
+                [MemoryLifecycleEvent(type="memory.created", item=item, cause_type="memory.create")],
+            )
+        case MemoryUpdate(item_id=item_id, partial=partial):
+            existing = state.items.get(item_id)
+            if existing is None:
+                raise MemoryNotFoundError(item_id)
+            merged = merge_item(existing, partial)
+            # Re-assigning an existing key keeps the item's position in the dict.
+            items = {**state.items, item_id: merged}
+            return CommandResult(
+                GraphState(items, state.edges),
+                [MemoryLifecycleEvent(type="memory.updated", item=merged, cause_type="memory.update")],
+            )
+        case MemoryRetract(item_id=item_id):
+            existing = state.items.get(item_id)
+            if existing is None:
+                raise MemoryNotFoundError(item_id)
+            items = dict(state.items)
+            del items[item_id]
+            edges = dict(state.edges)
+            # The item's own retraction event comes first, followed by one
+            # event per edge removed along with it.
+            events: list[MemoryLifecycleEvent] = [
+                MemoryLifecycleEvent(type="memory.retracted", item=existing, cause_type="memory.retract")
+            ]
+            # Iterate the original mapping while deleting from the copy, so the
+            # loop never mutates the dict it is iterating.
+            for edge_id, edge in state.edges.items():
+                if edge.from_ == item_id or edge.to == item_id:
+                    del edges[edge_id]
+                    events.append(
+                        MemoryLifecycleEvent(type="edge.retracted", edge=edge, cause_type="memory.retract")
+                    )
+            return CommandResult(GraphState(items, edges), events)
+        case EdgeCreate(edge=edge):
+            if edge.edge_id in state.edges:
+                raise DuplicateEdgeError(edge.edge_id)
+            edges = {**state.edges, edge.edge_id: edge}
+            return CommandResult(
+                GraphState(state.items, edges),
+                [MemoryLifecycleEvent(type="edge.created", edge=edge, cause_type="edge.create")],
+            )
+        case EdgeUpdate(edge_id=edge_id, partial=partial):
+            existing_edge = state.edges.get(edge_id)
+            if existing_edge is None:
+                raise EdgeNotFoundError(edge_id)
+            merged_edge = merge_edge(existing_edge, partial)
+            edges = {**state.edges, edge_id: merged_edge}
+            return CommandResult(
+                GraphState(state.items, edges),
+                [MemoryLifecycleEvent(type="edge.updated", edge=merged_edge, cause_type="edge.update")],
+            )
+        case EdgeRetract(edge_id=edge_id):
+            existing_edge = state.edges.get(edge_id)
+            if existing_edge is None:
+                raise EdgeNotFoundError(edge_id)
+            edges = dict(state.edges)
+            del edges[edge_id]
+            return CommandResult(
+                GraphState(state.items, edges),
+                [MemoryLifecycleEvent(type="edge.retracted", edge=existing_edge, cause_type="edge.retract")],
+            )
+        # Reached only by a BaseModel instance that is none of the command classes.
+        case _:  # pragma: no cover - defensive
+            raise TypeError(f"Unknown memory command: {command!r}")