PyPI - memplex - Versions diffs - 3.2.0__py3-none-any.whl - Mend

memplex 3.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

memnex/__init__.py +31 -0
memnex/__main__.py +6 -0
memnex/_plugin/.claude-plugin/plugin.json +24 -0
memnex/_plugin/.mcp.json +9 -0
memnex/_plugin/__init__.py +0 -0
memnex/_plugin/hooks/hooks.json +43 -0
memnex/_plugin/scripts/hook-runner.py +166 -0
memnex/_plugin/skills/mem-explore/SKILL.md +83 -0
memnex/_plugin/skills/mem-manage/SKILL.md +92 -0
memnex/_plugin/skills/mem-search/SKILL.md +85 -0
memnex/_plugin/skills/mem-write/SKILL.md +78 -0
memnex/adapters/__init__.py +14 -0
memnex/adapters/claude_skill.py +169 -0
memnex/adapters/cli.py +525 -0
memnex/adapters/http_api.py +314 -0
memnex/adapters/mcp_server.py +448 -0
memnex/compaction.py +563 -0
memnex/config.py +366 -0
memnex/core/__init__.py +13 -0
memnex/core/associator/__init__.py +8 -0
memnex/core/associator/domain_classifier.py +75 -0
memnex/core/associator/entity_aligner.py +127 -0
memnex/core/associator/ref_linker.py +197 -0
memnex/core/associator/term_mapper.py +77 -0
memnex/core/dictionaries/__init__.py +50 -0
memnex/core/engine.py +667 -0
memnex/core/extractors/__init__.py +15 -0
memnex/core/extractors/docx.py +97 -0
memnex/core/extractors/image.py +233 -0
memnex/core/extractors/markdown.py +139 -0
memnex/core/extractors/pdf.py +133 -0
memnex/core/extractors/vision_mapper.py +131 -0
memnex/core/handlers/__init__.py +7 -0
memnex/core/handlers/clipboard.py +40 -0
memnex/core/handlers/file_handler.py +62 -0
memnex/core/handlers/url_handler.py +132 -0
memnex/llm/__init__.py +25 -0
memnex/llm/enhancer.py +226 -0
memnex/llm/fallback_chain.py +87 -0
memnex/llm/injection_guard.py +178 -0
memnex/llm/provider.py +130 -0
memnex/llm/providers/__init__.py +22 -0
memnex/llm/providers/anthropic.py +135 -0
memnex/llm/providers/local.py +135 -0
memnex/llm/providers/rule_based.py +68 -0
memnex/llm/sanitizer.py +67 -0
memnex/models/__init__.py +68 -0
memnex/models/feedback.py +42 -0
memnex/models/graph.py +33 -0
memnex/models/memory.py +102 -0
memnex/models/misc.py +185 -0
memnex/models/paragraph.py +45 -0
memnex/models/search.py +51 -0
memnex/models/source.py +23 -0
memnex/models/task.py +62 -0
memnex/processing/__init__.py +1 -0
memnex/processing/graph_builder.py +278 -0
memnex/processing/merger/__init__.py +6 -0
memnex/processing/merger/confidence_calculator.py +127 -0
memnex/processing/merger/conflict_resolver.py +116 -0
memnex/retrieval/__init__.py +1 -0
memnex/retrieval/dedup.py +386 -0
memnex/retrieval/embedding.py +289 -0
memnex/retrieval/reranker.py +299 -0
memnex/service.py +902 -0
memnex/storage/__init__.py +65 -0
memnex/storage/base.py +132 -0
memnex/storage/changelog.py +106 -0
memnex/storage/feedback.py +486 -0
memnex/storage/lite/__init__.py +5 -0
memnex/storage/lite/store.py +606 -0
memnex/storage/vector.py +265 -0
memnex/wiki/__init__.py +11 -0
memnex/wiki/community.py +221 -0
memnex/wiki/compiler.py +545 -0
memnex/wiki/generator.py +270 -0
memnex/wiki/search.py +282 -0
memnex/worker.py +412 -0
memplex-3.2.0.dist-info/METADATA +37 -0
memplex-3.2.0.dist-info/RECORD +83 -0
memplex-3.2.0.dist-info/WHEEL +5 -0
memplex-3.2.0.dist-info/entry_points.txt +2 -0
memplex-3.2.0.dist-info/top_level.txt +1 -0

memnex/storage/lite/store.py ADDED Viewed

@@ -0,0 +1,606 @@
+"""LiteMemoryStore -- in-memory + JSON persistence backend.
+Data paths::
+    ~/.memnex/memory.json      Functions + graph edges
+    ~/.memnex/changelog.json   Changelog events (via ChangelogStore)
+Functions and graph edges are held in memory and flushed to JSON on every
+write; observations are kept in memory only and are not written to disk.
+Atomic replacement (write-to-temp + rename) guards against partial writes.
+Single-thread assumption: optimistic lock is skipped.
+"""
+from __future__ import annotations
+import copy
+import json
+import logging
+import math
+import tempfile
+from datetime import datetime
+from pathlib import Path
+from typing import Any, Dict, List, Optional
+from memnex.models import (
+    BatchResult,
+    ChangelogEvent,
+    FieldValue,
+    Function,
+    GraphData,
+    GraphEdge,
+    MergeResult,
+    Observation,
+    SearchFilters,
+    SearchResult,
+    SourceDocument,
+    SourceType,
+)
+from memnex.storage.changelog import ChangelogStore
+logger = logging.getLogger(__name__)
+# ── Serialization helpers ────────────────────────────────────────────
+def _json_serializer(obj: Any) -> Any:
+    """Default serializer for ``json.dumps``."""
+    if isinstance(obj, datetime):
+        return obj.isoformat()
+    if isinstance(obj, Path):
+        return str(obj)
+    if isinstance(obj, SourceType):
+        return obj.value
+    raise TypeError(f"Object of type {type(obj).__name__} is not JSON serializable")
+def _serialize_field_value(fv: FieldValue) -> dict:
+    return {
+        "desc": fv.desc,
+        "sources": fv.sources,
+        "source_method": fv.source_method,
+        "weight": fv.weight,
+        "observation": fv.observation,
+        "created_at": (
+            fv.created_at.isoformat() if isinstance(fv.created_at, datetime) else fv.created_at
+        ),
+        "status": fv.status,
+    }
+def _deserialize_field_value(d: dict) -> FieldValue:
+    created_at = d.get("created_at")
+    if isinstance(created_at, str):
+        created_at = datetime.fromisoformat(created_at)
+    return FieldValue(
+        desc=d["desc"],
+        sources=d.get("sources", []),
+        source_method=d.get("source_method", "rule_based"),
+        weight=d.get("weight", 1.0),
+        observation=d.get("observation"),
+        created_at=created_at,
+        status=d.get("status", "active"),
+    )
+def _serialize_function(func: Function) -> dict:
+    return {
+        "id": func.id,
+        "memory_type": func.memory_type,
+        "name": func.name,
+        "name_normalized": func.name_normalized,
+        "domain": func.domain,
+        "confidence": func.confidence,
+        "source_type": func.source_type.value if isinstance(func.source_type, SourceType) else func.source_type,
+        "owner": func.owner,
+        "version": func.version,
+        "created_at": func.created_at,
+        "updated_at": func.updated_at,
+        "origin_session": func.origin_session,
+        "access_count": func.access_count,
+        "last_accessed_at": func.last_accessed_at,
+        "source_paragraphs": func.source_paragraphs,
+        "needs_review": func.needs_review,
+        "needs_review_until": func.needs_review_until,
+        "content_hash": func.content_hash,
+        "trigger": [_serialize_field_value(fv) for fv in func.trigger],
+        "condition": [_serialize_field_value(fv) for fv in func.condition],
+        "action": [_serialize_field_value(fv) for fv in func.action],
+        "benefit": [_serialize_field_value(fv) for fv in func.benefit],
+        "attributes": func.attributes,
+        "cross_references": func.cross_references,
+        "priority_from_source": func.priority_from_source,
+        "source_authority": func.source_authority,
+    }
+def _deserialize_function(d: dict) -> Function:
+    source_type = d.get("source_type", "wiki")
+    if isinstance(source_type, str):
+        try:
+            source_type = SourceType(source_type)
+        except ValueError:
+            source_type = SourceType.WIKI
+    return Function(
+        id=d["id"],
+        memory_type=d.get("memory_type", "function"),
+        name=d.get("name", ""),
+        name_normalized=d.get("name_normalized", ""),
+        domain=d.get("domain"),
+        confidence=d.get("confidence", 1.0),
+        source_type=source_type,
+        owner=d.get("owner"),
+        version=d.get("version", 1),
+        created_at=d.get("created_at"),
+        updated_at=d.get("updated_at"),
+        origin_session=d.get("origin_session"),
+        access_count=d.get("access_count", 0),
+        last_accessed_at=d.get("last_accessed_at"),
+        source_paragraphs=d.get("source_paragraphs", []),
+        needs_review=d.get("needs_review", False),
+        needs_review_until=d.get("needs_review_until"),
+        content_hash=d.get("content_hash"),
+        trigger=[_deserialize_field_value(fv) for fv in d.get("trigger", [])],
+        condition=[_deserialize_field_value(fv) for fv in d.get("condition", [])],
+        action=[_deserialize_field_value(fv) for fv in d.get("action", [])],
+        benefit=[_deserialize_field_value(fv) for fv in d.get("benefit", [])],
+        attributes=d.get("attributes", {}),
+        cross_references=d.get("cross_references", []),
+        priority_from_source=d.get("priority_from_source"),
+        source_authority=d.get("source_authority"),
+    )
+def _serialize_edge(edge: GraphEdge) -> dict:
+    return {
+        "source": edge.source,
+        "target": edge.target,
+        "edge_type": edge.edge_type,
+        "weight": edge.weight,
+        "evidence": edge.evidence,
+        "created_at": (
+            edge.created_at.isoformat() if isinstance(edge.created_at, datetime) else edge.created_at
+        ),
+    }
+def _deserialize_edge(d: dict) -> GraphEdge:
+    created_at = d.get("created_at")
+    if isinstance(created_at, str):
+        created_at = datetime.fromisoformat(created_at)
+    return GraphEdge(
+        source=d["source"],
+        target=d["target"],
+        edge_type=d["edge_type"],
+        weight=d.get("weight", 1.0),
+        evidence=d.get("evidence", []),
+        created_at=created_at,
+    )
+# ── Merge helpers ────────────────────────────────────────────────────
+def _merge_field_values(
+    existing: List[FieldValue],
+    incoming: List[FieldValue],
+) -> List[FieldValue]:
+    """Merge incoming FieldValues into existing.  Duplicates (by desc) are
+    skipped; weight and observation are taken from the newer entry.
+    """
+    seen = {fv.desc for fv in existing}
+    merged = list(existing)
+    for fv in incoming:
+        if fv.desc not in seen:
+            merged.append(fv)
+            seen.add(fv.desc)
+    return merged
+def _normalize_name(name: str) -> str:
+    """Produce a normalised form for dedup matching."""
+    return name.strip().lower()
+# ── LiteMemoryStore ──────────────────────────────────────────────────
+class LiteMemoryStore:
+    """InMemory + JSON persistence backend.
+    Parameters
+    ----------
+    path:
+        Root JSON file path.  Defaults to ``~/.memnex/memory.json``.
+    """
+    def __init__(self, path: Optional[Path] = None) -> None:
+        self._path = path or Path("~/.memnex/memory.json").expanduser()
+        self._functions: Dict[str, Function] = {}
+        self._name_index: Dict[str, str] = {}  # name_normalized -> func_id
+        self._edges: List[GraphEdge] = []
+        self._observations: List[Observation] = []
+        self._changelog = ChangelogStore(
+            path=self._path.parent / "changelog.json"
+        )
+        self._load()
+    # ── Public: Write ───────────────────────────────────────────────
+    def add(self, func: Function, source: SourceDocument) -> None:
+        norm = _normalize_name(func.name_normalized or func.name)
+        existing_id = self._name_index.get(norm)
+        if existing_id and existing_id in self._functions:
+            existing = self._functions[existing_id]
+            # Merge FieldValues
+            existing.trigger = _merge_field_values(existing.trigger, func.trigger)
+            existing.condition = _merge_field_values(existing.condition, func.condition)
+            existing.action = _merge_field_values(existing.action, func.action)
+            existing.benefit = _merge_field_values(existing.benefit, func.benefit)
+            # Merge source paragraphs
+            for sp in func.source_paragraphs:
+                if sp not in existing.source_paragraphs:
+                    existing.source_paragraphs.append(sp)
+            existing.updated_at = datetime.utcnow().isoformat()
+            existing.version += 1
+            self._changelog.append(ChangelogEvent(
+                func_id=existing.id,
+                timestamp=datetime.now(),
+                event_type="updated",
+                description=f"Merged fields from source",
+                source=getattr(source, "source_path", None) or getattr(source, "url", "") or "",
+                actor="system",
+            ))
+        else:
+            self._functions[func.id] = func
+            self._name_index[norm] = func.id
+            self._changelog.append(ChangelogEvent(
+                func_id=func.id,
+                timestamp=datetime.now(),
+                event_type="created",
+                description=f"Created function: {func.name}",
+                source=getattr(source, "source_path", None) or getattr(source, "url", "") or "",
+                actor="system",
+            ))
+        self._save()
+    def add_batch(
+        self,
+        funcs: List[Function],
+        sources: List[SourceDocument],
+    ) -> BatchResult:
+        result = BatchResult(total=len(funcs))
+        for func, src in zip(funcs, sources):
+            try:
+                self.add(func, src)
+                result.succeeded += 1
+            except Exception as exc:
+                result.failed_items.append({
+                    "func_id": func.id,
+                    "name": func.name,
+                    "error": str(exc),
+                })
+        return result
+    def add_observation(self, observation: Observation) -> None:
+        """Append ``observation`` to the in-memory observation list.
+
+        Unlike the other write methods of this class, this one does not call
+        ``_save()``.
+        """
+        self._observations.append(observation)
+    def increment_access(self, func_id: str) -> None:
+        func = self._functions.get(func_id)
+        if func is None:
+            return
+        func.access_count += 1
+        func.last_accessed_at = datetime.utcnow().isoformat()
+        self._save()
+    # ── Public: Retrieval ───────────────────────────────────────────
+    def vector_search(self, text: str, top_k: int = 5) -> List[SearchResult]:
+        """Basic TF-IDF cosine similarity search over Function text."""
+        query_words = set(text.lower().split())
+        scored: List[tuple] = []
+        for func in self._functions.values():
+            func_text = self._function_to_search_text(func)
+            func_words = set(func_text.lower().split())
+            if not query_words or not func_words:
+                score = 0.0
+            else:
+                intersection = query_words & func_words
+                union = query_words | func_words
+                score = len(intersection) / (len(union) + 1e-10)
+            scored.append((score, func))
+        scored.sort(key=lambda x: x[0], reverse=True)
+        results: List[SearchResult] = []
+        for score, func in scored[:top_k]:
+            if score <= 0:
+                continue
+            results.append(SearchResult(
+                func_id=func.id,
+                name=func.name,
+                domain=func.domain or "",
+                relevance_score=score,
+                summary=self._function_to_search_text(func),
+                source_type=func.source_type,
+                created_at=func.created_at,
+                updated_at=func.updated_at,
+                origin=func.origin_session or "",
+            ))
+        return results
+    def fts_search(self, text: str, top_k: int = 10) -> List[SearchResult]:
+        """Keyword matching search."""
+        query_lower = text.lower()
+        scored: List[tuple] = []
+        for func in self._functions.values():
+            func_text = self._function_to_search_text(func).lower()
+            count = func_text.count(query_lower)
+            if count > 0:
+                scored.append((count, func))
+        scored.sort(key=lambda x: x[0], reverse=True)
+        results: List[SearchResult] = []
+        for count, func in scored[:top_k]:
+            results.append(SearchResult(
+                func_id=func.id,
+                name=func.name,
+                domain=func.domain or "",
+                relevance_score=min(count / 5.0, 1.0),
+                summary=self._function_to_search_text(func),
+                source_type=func.source_type,
+                created_at=func.created_at,
+                updated_at=func.updated_at,
+                origin=func.origin_session or "",
+            ))
+        return results
+    def filter(self, filters: SearchFilters) -> List[Function]:
+        results: List[Function] = []
+        for func in self._functions.values():
+            if not self._matches_filter(func, filters):
+                continue
+            results.append(func)
+        return results
+    # ── Public: Read ────────────────────────────────────────────────
+    def get(self, func_id: str) -> Optional[Function]:
+        """Return the stored function with id ``func_id``, or ``None`` if absent."""
+        return self._functions.get(func_id)
+    def get_neighbors(
+        self,
+        func_id: str,
+        edge_types: Optional[List[str]] = None,
+        max_hops: int = 1,
+    ) -> List[Function]:
+        if max_hops < 1:
+            return []
+        # BFS
+        visited: set = {func_id}
+        current_level = {func_id}
+        neighbor_ids: set = set()
+        for _ in range(max_hops):
+            next_level: set = set()
+            for fid in current_level:
+                for edge in self._edges:
+                    if edge_types and edge.edge_type not in edge_types:
+                        continue
+                    if edge.source == fid and edge.target not in visited:
+                        next_level.add(edge.target)
+                    elif edge.target == fid and edge.source not in visited:
+                        next_level.add(edge.source)
+            visited |= next_level
+            neighbor_ids |= next_level
+            current_level = next_level
+        return [
+            self._functions[fid]
+            for fid in neighbor_ids
+            if fid in self._functions
+        ]
+    def get_graph(self, func_ids: Optional[List[str]] = None) -> GraphData:
+        if func_ids is None:
+            nodes = list(self._functions.values())
+            edges = list(self._edges)
+        else:
+            id_set = set(func_ids)
+            nodes = [
+                self._functions[fid]
+                for fid in func_ids
+                if fid in self._functions
+            ]
+            edges = [
+                e for e in self._edges
+                if e.source in id_set or e.target in id_set
+            ]
+        return GraphData(nodes=nodes, edges=edges)
+    def get_timeline(self, func_id: str, limit: int = 20) -> List[ChangelogEvent]:
+        """Return changelog events for ``func_id``; delegates to the changelog store's ``get_timeline``."""
+        return self._changelog.get_timeline(func_id, limit)
+    def list_functions(
+        self,
+        offset: int = 0,
+        limit: int = 1000,
+        owner: Optional[str] = None,
+    ) -> List[Function]:
+        funcs = list(self._functions.values())
+        if owner is not None:
+            funcs = [f for f in funcs if f.owner == owner]
+        return funcs[offset : offset + limit]
+    # ── Public: Delete / Merge / Clear ──────────────────────────────
+    def delete(self, func_id: str) -> None:
+        self._functions.pop(func_id, None)
+        # Remove from name index
+        to_remove = [
+            norm for norm, fid in self._name_index.items() if fid == func_id
+        ]
+        for norm in to_remove:
+            del self._name_index[norm]
+        # Remove edges referencing this function
+        self._edges = [
+            e for e in self._edges
+            if e.source != func_id and e.target != func_id
+        ]
+        self._save()
+    def merge(self, sub_graph: GraphData) -> MergeResult:
+        result = MergeResult(merged=True)
+        # Merge nodes
+        for node in sub_graph.nodes:
+            func_id = getattr(node, "id", None)
+            if not func_id:
+                continue
+            if func_id in self._functions:
+                existing = self._functions[func_id]
+                if hasattr(node, "trigger"):
+                    existing.trigger = _merge_field_values(
+                        existing.trigger, node.trigger
+                    )
+                if hasattr(node, "condition"):
+                    existing.condition = _merge_field_values(
+                        existing.condition, node.condition
+                    )
+                if hasattr(node, "action"):
+                    existing.action = _merge_field_values(
+                        existing.action, node.action
+                    )
+                if hasattr(node, "benefit"):
+                    existing.benefit = _merge_field_values(
+                        existing.benefit, node.benefit
+                    )
+                existing.updated_at = datetime.utcnow().isoformat()
+                existing.version += 1
+                result.updated_functions += 1
+            else:
+                self._functions[func_id] = node
+                norm = _normalize_name(
+                    getattr(node, "name_normalized", "")
+                    or getattr(node, "name", "")
+                )
+                if norm:
+                    self._name_index[norm] = func_id
+                result.new_functions += 1
+        # Merge edges (skip duplicates)
+        existing_edge_keys = {
+            (e.source, e.target, e.edge_type) for e in self._edges
+        }
+        for edge in sub_graph.edges:
+            key = (edge.source, edge.target, edge.edge_type)
+            if key not in existing_edge_keys:
+                self._edges.append(edge)
+                existing_edge_keys.add(key)
+                result.new_edges += 1
+        self._save()
+        return result
+    def clear(self) -> None:
+        self._functions.clear()
+        self._name_index.clear()
+        self._edges.clear()
+        self._observations.clear()
+        self._changelog.clear()
+        self._save()
+    # ── Persistence ─────────────────────────────────────────────────
+    def _save(self) -> None:
+        self._path.parent.mkdir(parents=True, exist_ok=True)
+        data = {
+            "functions": [_serialize_function(f) for f in self._functions.values()],
+            "edges": [_serialize_edge(e) for e in self._edges],
+        }
+        tmp_fd, tmp_path = tempfile.mkstemp(
+            dir=str(self._path.parent), suffix=".tmp"
+        )
+        try:
+            with open(tmp_fd, "w", encoding="utf-8") as fh:
+                json.dump(data, fh, default=_json_serializer, ensure_ascii=False, indent=2)
+            Path(tmp_path).replace(self._path)
+        except Exception:
+            Path(tmp_path).unlink(missing_ok=True)
+            raise
+    def _load(self) -> None:
+        if not self._path.exists():
+            return
+        try:
+            raw = json.loads(self._path.read_text(encoding="utf-8"))
+        except Exception:
+            logger.warning("Failed to load memory from %s", self._path)
+            return
+        for fd in raw.get("functions", []):
+            func = _deserialize_function(fd)
+            self._functions[func.id] = func
+            norm = _normalize_name(func.name_normalized or func.name)
+            if norm:
+                self._name_index[norm] = func.id
+        for ed in raw.get("edges", []):
+            self._edges.append(_deserialize_edge(ed))
+    # ── Internal helpers ────────────────────────────────────────────
+    @staticmethod
+    def _function_to_search_text(func: Function) -> str:
+        parts = [func.name, func.domain or ""]
+        for fv in func.trigger:
+            parts.append(fv.desc)
+        for fv in func.action:
+            parts.append(fv.desc)
+        for fv in func.benefit:
+            parts.append(fv.desc)
+        return " ".join(parts)
+    @staticmethod
+    def _matches_filter(func: Function, filters: SearchFilters) -> bool:
+        if filters.domain and func.domain not in filters.domain:
+            return False
+        if (
+            filters.source_type
+            and func.source_type not in filters.source_type
+        ):
+            return False
+        if filters.confidence_min is not None:
+            if func.confidence < filters.confidence_min:
+                return False
+        if filters.owner is not None and func.owner != filters.owner:
+            return False
+        if filters.needs_review is not None:
+            if func.needs_review != filters.needs_review:
+                return False
+        # Datetime filters: compare ISO strings lexicographically
+        if filters.updated_after is not None:
+            after = (
+                filters.updated_after.isoformat()
+                if hasattr(filters.updated_after, "isoformat")
+                else str(filters.updated_after)
+            )
+            if func.updated_at and func.updated_at < after:
+                return False
+        if filters.updated_before is not None:
+            before = (
+                filters.updated_before.isoformat()
+                if hasattr(filters.updated_before, "isoformat")
+                else str(filters.updated_before)
+            )
+            if func.updated_at and func.updated_at > before:
+                return False
+        return True