npm - @smilintux/skmemory - Versions diffs - 0.5.0 → 0.7.2 - Mend

@smilintux/skmemory 0.5.0 → 0.7.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

package/.github/workflows/ci.yml +39 -3
package/.github/workflows/publish.yml +13 -6
package/AGENT_REFACTOR_CHANGES.md +192 -0
package/ARCHITECTURE.md +101 -19
package/CHANGELOG.md +153 -0
package/LICENSE +81 -68
package/MISSION.md +7 -0
package/README.md +419 -86
package/SKILL.md +197 -25
package/docker-compose.yml +15 -15
package/index.js +6 -5
package/openclaw-plugin/openclaw.plugin.json +10 -0
package/openclaw-plugin/src/index.ts +255 -0
package/openclaw-plugin/src/openclaw.plugin.json +10 -0
package/package.json +1 -1
package/pyproject.toml +29 -9
package/requirements.txt +10 -2
package/seeds/cloud9-opus.seed.json +7 -7
package/seeds/lumina-cloud9-breakthrough.seed.json +46 -0
package/seeds/lumina-cloud9-python-pypi.seed.json +46 -0
package/seeds/lumina-kingdom-founding.seed.json +47 -0
package/seeds/lumina-pma-signed.seed.json +46 -0
package/seeds/lumina-singular-achievement.seed.json +46 -0
package/seeds/lumina-skcapstone-conscious.seed.json +46 -0
package/seeds/plant-kingdom-journal.py +203 -0
package/seeds/plant-lumina-seeds.py +280 -0
package/skill.yaml +46 -0
package/skmemory/HA.md +296 -0
package/skmemory/__init__.py +12 -1
package/skmemory/agents.py +233 -0
package/skmemory/ai_client.py +40 -0
package/skmemory/anchor.py +4 -2
package/skmemory/backends/__init__.py +11 -4
package/skmemory/backends/file_backend.py +2 -1
package/skmemory/backends/skgraph_backend.py +608 -0
package/skmemory/backends/{qdrant_backend.py → skvector_backend.py} +99 -69
package/skmemory/backends/sqlite_backend.py +122 -51
package/skmemory/backends/vaulted_backend.py +286 -0
package/skmemory/cli.py +1238 -29
package/skmemory/config.py +173 -0
package/skmemory/context_loader.py +335 -0
package/skmemory/endpoint_selector.py +386 -0
package/skmemory/fortress.py +685 -0
package/skmemory/graph_queries.py +238 -0
package/skmemory/importers/__init__.py +9 -1
package/skmemory/importers/telegram.py +351 -43
package/skmemory/importers/telegram_api.py +488 -0
package/skmemory/journal.py +4 -2
package/skmemory/lovenote.py +4 -2
package/skmemory/mcp_server.py +706 -0
package/skmemory/models.py +41 -0
package/skmemory/openclaw.py +8 -8
package/skmemory/predictive.py +232 -0
package/skmemory/promotion.py +524 -0
package/skmemory/register.py +454 -0
package/skmemory/register_mcp.py +197 -0
package/skmemory/ritual.py +121 -47
package/skmemory/seeds.py +257 -8
package/skmemory/setup_wizard.py +920 -0
package/skmemory/sharing.py +402 -0
package/skmemory/soul.py +71 -20
package/skmemory/steelman.py +250 -263
package/skmemory/store.py +271 -60
package/skmemory/vault.py +228 -0
package/tests/integration/__init__.py +0 -0
package/tests/integration/conftest.py +233 -0
package/tests/integration/test_cross_backend.py +355 -0
package/tests/integration/test_skgraph_live.py +424 -0
package/tests/integration/test_skvector_live.py +369 -0
package/tests/test_backup_rotation.py +327 -0
package/tests/test_cli.py +6 -6
package/tests/test_endpoint_selector.py +801 -0
package/tests/test_fortress.py +255 -0
package/tests/test_fortress_hardening.py +444 -0
package/tests/test_openclaw.py +5 -2
package/tests/test_predictive.py +237 -0
package/tests/test_promotion.py +340 -0
package/tests/test_ritual.py +4 -4
package/tests/test_seeds.py +96 -0
package/tests/test_setup.py +835 -0
package/tests/test_sharing.py +250 -0
package/tests/test_skgraph_backend.py +667 -0
package/tests/test_skvector_backend.py +326 -0
package/tests/test_steelman.py +5 -5
package/tests/test_store_graph_integration.py +245 -0
package/tests/test_vault.py +186 -0
package/skmemory/backends/falkordb_backend.py +0 -310

package/skmemory/endpoint_selector.py ADDED Viewed

@@ -0,0 +1,386 @@
+"""
+SKMemory Endpoint Selector — HA routing for SKVector and SKGraph backends.
+Discovers multiple backend endpoints (via config or heartbeat mesh),
+probes their latency, selects the fastest healthy one, and fails over
+automatically.  No background threads — probing is on-demand with a
+TTL cache.
+Design principles:
+    - Selector picks a URL, backends stay unchanged
+    - On-demand probing with TTL cache (no background threads)
+    - Config endpoints take precedence over heartbeat discovery
+    - Graceful degradation everywhere
+    - Backward compatible: single-URL configs work unchanged
+"""
+from __future__ import annotations
+import json
+import logging
+import socket
+import time
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Optional
+from urllib.parse import urlparse
+from pydantic import BaseModel, Field
+logger = logging.getLogger("skmemory.endpoint_selector")
+# ---------------------------------------------------------------------------
+# Models
+# ---------------------------------------------------------------------------
+class Endpoint(BaseModel):
+    """A single backend endpoint with health and latency tracking.
+    Instances are mutable records: EndpointSelector updates the health
+    fields in place when it probes or when a caller marks a URL unhealthy.
+    """
+    # Full endpoint URL; host and port are parsed from it when probing.
+    url: str
+    role: str = "primary"           # primary | replica
+    tailscale_ip: str = ""          # optional, for display
+    # -1 = not yet probed; also reset to -1 whenever a probe fails.
+    latency_ms: float = -1.0        # -1 = not yet probed
+    # Flipped to False once fail_count reaches RoutingConfig.max_fail_count
+    # (or directly by EndpointSelector.mark_unhealthy); a successful probe
+    # sets it back to True.
+    healthy: bool = True
+    # Written as a UTC ISO-8601 string after every probe / mark_unhealthy.
+    last_checked: str = ""          # ISO timestamp
+    # Consecutive failed probes; reset to 0 by a successful probe.
+    fail_count: int = 0
+class RoutingConfig(BaseModel):
+    """Configuration for endpoint routing behavior.
+    Read by EndpointSelector to decide how endpoints are chosen and how
+    often / how patiently they are probed.
+    """
+    # Any value other than the four listed is handled like "failover"
+    # (the first healthy endpoint is returned).
+    strategy: str = "failover"      # failover | latency | local-first | read-local-write-primary
+    # Minimum age of the cached probe results before a select_* call
+    # triggers a fresh probe of all endpoints.
+    probe_interval_seconds: int = 30
+    # Timeout passed to the TCP connect used for each probe.
+    probe_timeout_seconds: int = 3
+    max_fail_count: int = 3         # mark unhealthy after N consecutive failures
+    # NOTE(review): nothing in this module reads this field — unhealthy
+    # endpoints are re-probed on the normal probe cycle.  Confirm whether a
+    # consumer elsewhere depends on it.
+    recovery_interval_seconds: int = 60  # re-check unhealthy endpoints
+# ---------------------------------------------------------------------------
+# EndpointSelector
+# ---------------------------------------------------------------------------
+class EndpointSelector:
+    """Routes requests to the best available backend endpoint.
+    Sits between config resolution and backend construction — picks the
+    best URL, then the caller creates backends normally with that URL.
+    Probing is on-demand: every ``select_*`` call re-probes all endpoints
+    once the cached results are older than ``probe_interval_seconds``.
+    Args:
+        skvector_endpoints: List of SKVector endpoint dicts or Endpoint objects.
+        skgraph_endpoints: List of SKGraph endpoint dicts or Endpoint objects.
+        config: Routing configuration.
+    """
+    # Hostnames that the local-preferring strategies treat as "this machine".
+    _LOCAL_HOSTS = ("localhost", "127.0.0.1", "::1")
+    def __init__(
+        self,
+        skvector_endpoints: Optional[list[dict | Endpoint]] = None,
+        skgraph_endpoints: Optional[list[dict | Endpoint]] = None,
+        config: Optional[RoutingConfig] = None,
+    ) -> None:
+        self._config = config or RoutingConfig()
+        self._skvector: list[Endpoint] = self._normalize(skvector_endpoints or [])
+        self._skgraph: list[Endpoint] = self._normalize(skgraph_endpoints or [])
+        # 0.0 is the "never probed" sentinel; see _maybe_probe() and status().
+        self._last_probe_time: float = 0.0
+    @staticmethod
+    def _normalize(endpoints: list[dict | Endpoint]) -> list[Endpoint]:
+        """Convert dicts/Endpoints into a uniform list of Endpoint objects.
+        Endpoint instances are kept as-is (not copied), dicts are expanded
+        into ``Endpoint(**d)``, and any other object is read through its
+        ``url`` / ``role`` / ``tailscale_ip`` attributes.  Objects without a
+        ``url`` attribute are logged and skipped.
+        """
+        result: list[Endpoint] = []
+        for ep in endpoints:
+            if isinstance(ep, Endpoint):
+                result.append(ep)
+            elif isinstance(ep, dict):
+                result.append(Endpoint(**ep))
+            else:
+                # Try pydantic model with .url attribute (EndpointConfig)
+                try:
+                    result.append(Endpoint(
+                        url=ep.url,
+                        role=getattr(ep, "role", "primary"),
+                        tailscale_ip=getattr(ep, "tailscale_ip", ""),
+                    ))
+                except AttributeError:
+                    logger.warning("Cannot normalize endpoint: %s", ep)
+        return result
+    # -------------------------------------------------------------------
+    # Core selection
+    # -------------------------------------------------------------------
+    def select_skvector(self, for_write: bool = False) -> Optional[Endpoint]:
+        """Select the best SKVector endpoint.
+        Args:
+            for_write: If True and strategy is read-local-write-primary,
+                       returns only primary endpoints.
+        Returns:
+            Best Endpoint or None if all unhealthy.
+        """
+        self._maybe_probe()
+        return self._select(self._skvector, for_write)
+    def select_skgraph(self, for_write: bool = False) -> Optional[Endpoint]:
+        """Select the best SKGraph endpoint.
+        Args:
+            for_write: If True and strategy is read-local-write-primary,
+                       returns only primary endpoints.
+        Returns:
+            Best Endpoint or None if all unhealthy.
+        """
+        self._maybe_probe()
+        return self._select(self._skgraph, for_write)
+    @classmethod
+    def _is_local(cls, endpoint: Endpoint) -> bool:
+        """Return True when the endpoint URL points at a loopback host."""
+        return (urlparse(endpoint.url).hostname or "") in cls._LOCAL_HOSTS
+    @staticmethod
+    def _fastest(candidates: list[Endpoint]) -> Endpoint:
+        """Return the lowest-latency probed candidate.
+        Candidates without a latency measurement (``latency_ms < 0``) are
+        ignored; when none has been measured the first candidate wins.
+        *candidates* must be non-empty.
+        """
+        probed = [ep for ep in candidates if ep.latency_ms >= 0]
+        if probed:
+            return min(probed, key=lambda e: e.latency_ms)
+        return candidates[0]
+    def _select(self, endpoints: list[Endpoint], for_write: bool) -> Optional[Endpoint]:
+        """Apply the routing strategy to pick the best endpoint.
+        Args:
+            endpoints: Endpoint list to choose from (order matters for
+                       strategies that take the first healthy entry).
+            for_write: Restricts candidates to primaries under the
+                       read-local-write-primary strategy.
+        Returns:
+            The chosen Endpoint, or None when no healthy candidate exists.
+        """
+        if not endpoints:
+            return None
+        strategy = self._config.strategy
+        split_mode = strategy == "read-local-write-primary"
+        if split_mode and for_write:
+            candidates = [ep for ep in endpoints if ep.healthy and ep.role == "primary"]
+        else:
+            candidates = [ep for ep in endpoints if ep.healthy]
+        if not candidates:
+            return None
+        if strategy == "latency":
+            return self._fastest(candidates)
+        if strategy == "local-first" or (split_mode and not for_write):
+            # Prefer a loopback endpoint, then fall back to lowest latency.
+            local = next((ep for ep in candidates if self._is_local(ep)), None)
+            return local if local is not None else self._fastest(candidates)
+        # "failover", writes under read-local-write-primary (already filtered
+        # to primaries above) and unknown strategies: first healthy endpoint.
+        return candidates[0]
+    # -------------------------------------------------------------------
+    # Health probing
+    # -------------------------------------------------------------------
+    def _maybe_probe(self) -> None:
+        """Probe if never probed or results are older than probe_interval_seconds."""
+        last = self._last_probe_time
+        # The reference point of time.monotonic() is undefined, so a raw
+        # reading must not be compared against the 0.0 sentinel: on a clock
+        # that is still below the interval the first probe would be skipped.
+        if last <= 0 or time.monotonic() - last >= self._config.probe_interval_seconds:
+            self.probe_all()
+    def probe_all(self) -> dict:
+        """Probe all endpoints and return results summary.
+        Unhealthy endpoints are probed as well, so a successful connect
+        brings them back into rotation.
+        Returns:
+            Dict with skvector and skgraph probe results.
+        """
+        results = {
+            "skvector": [self.probe_endpoint(ep) for ep in self._skvector],
+            "skgraph": [self.probe_endpoint(ep) for ep in self._skgraph],
+        }
+        self._last_probe_time = time.monotonic()
+        return results
+    @staticmethod
+    def _probe_target(url: str) -> tuple[str, int]:
+        """Return the ``(host, port)`` pair a probe of *url* should connect to.
+        A missing host defaults to ``localhost``; a missing port is inferred
+        from the scheme (redis/rediss → 6379, https → 443, otherwise 80).
+        Raises:
+            ValueError: If the URL or its port component cannot be parsed.
+        """
+        parsed = urlparse(url)
+        host = parsed.hostname or "localhost"
+        port = parsed.port  # ValueError on a non-numeric or out-of-range port
+        if port is None:
+            # Infer default ports from scheme
+            if parsed.scheme in ("redis", "rediss"):
+                port = 6379
+            elif parsed.scheme == "https":
+                port = 443
+            else:
+                port = 80
+        return host, port
+    def probe_endpoint(self, endpoint: Endpoint) -> Endpoint:
+        """Probe a single endpoint's TCP connectivity and measure latency.
+        Updates the endpoint in-place and returns it.  A URL that cannot be
+        parsed is counted as a failed probe instead of raising, so one bad
+        entry cannot break endpoint selection.
+        Args:
+            endpoint: The endpoint to probe.
+        Returns:
+            The same Endpoint, updated with latency/health status.
+        """
+        try:
+            host, port = self._probe_target(endpoint.url)
+            start = time.monotonic()
+            # The context manager closes the socket even if timing fails.
+            with socket.create_connection(
+                (host, port),
+                timeout=self._config.probe_timeout_seconds,
+            ):
+                elapsed_ms = (time.monotonic() - start) * 1000
+        except (OSError, ValueError):
+            # OSError covers refused/unreachable/timeout; ValueError covers
+            # malformed URLs and host names that cannot be encoded.
+            endpoint.fail_count += 1
+            endpoint.latency_ms = -1.0
+            if endpoint.fail_count >= self._config.max_fail_count:
+                endpoint.healthy = False
+        else:
+            endpoint.latency_ms = round(elapsed_ms, 2)
+            endpoint.fail_count = 0
+            endpoint.healthy = True
+        endpoint.last_checked = datetime.now(timezone.utc).isoformat()
+        return endpoint
+    def mark_unhealthy(self, url: str) -> None:
+        """Mark an endpoint as unhealthy by URL.
+        Called externally when a backend operation fails, so the next
+        selection picks a different endpoint.  Every endpoint (SKVector or
+        SKGraph) whose URL matches exactly is marked.
+        Args:
+            url: The URL of the endpoint to mark.
+        """
+        for ep in self._skvector + self._skgraph:
+            if ep.url == url:
+                ep.fail_count = self._config.max_fail_count
+                ep.healthy = False
+                ep.last_checked = datetime.now(timezone.utc).isoformat()
+    # -------------------------------------------------------------------
+    # Heartbeat mesh discovery
+    # -------------------------------------------------------------------
+    def discover_from_heartbeats(self, heartbeat_dir: Optional[Path] = None) -> None:
+        """Discover backend endpoints from heartbeat mesh files.
+        Reads heartbeat JSON files and looks for a ``services`` field
+        containing advertised backend services.  Discovered endpoints are
+        appended as replicas unless an endpoint with the same URL already
+        exists (config takes precedence).  Unreadable or malformed
+        heartbeat files and service entries are skipped.
+        Args:
+            heartbeat_dir: Path to heartbeat directory.
+                           Defaults to the ``heartbeats`` directory next to
+                           ``AGENTS_BASE_DIR``.
+        """
+        if heartbeat_dir is None:
+            from .agents import AGENTS_BASE_DIR
+            # heartbeats/ is a sibling of agents/ under the skcapstone root
+            heartbeat_dir = AGENTS_BASE_DIR.parent / "heartbeats"
+        if not heartbeat_dir.is_dir():
+            logger.debug("Heartbeat directory not found: %s", heartbeat_dir)
+            return
+        existing_skvector_urls = {ep.url for ep in self._skvector}
+        existing_skgraph_urls = {ep.url for ep in self._skgraph}
+        for f in sorted(heartbeat_dir.glob("*.json")):
+            try:
+                data = json.loads(f.read_text(encoding="utf-8"))
+            except (ValueError, OSError) as exc:
+                # ValueError covers both invalid JSON and invalid UTF-8.
+                logger.debug("Cannot read heartbeat %s: %s", f.name, exc)
+                continue
+            if not isinstance(data, dict):
+                logger.debug("Ignoring heartbeat %s: not a JSON object", f.name)
+                continue
+            services = data.get("services", [])
+            if not services or not isinstance(services, list):
+                continue
+            hostname = data.get("hostname", "")
+            tailscale_ip = data.get("tailscale_ip", "")
+            # Prefer tailscale_ip, fall back to hostname
+            host = tailscale_ip or hostname
+            if not host:
+                continue
+            # A bare IPv6 literal must be bracketed, otherwise its colons
+            # are mistaken for the port separator when the URL is parsed.
+            if isinstance(host, str) and ":" in host and not host.startswith("["):
+                host = f"[{host}]"
+            for svc in services:
+                if not isinstance(svc, dict):
+                    continue
+                name = svc.get("name", "")
+                port = svc.get("port", 0)
+                protocol = svc.get("protocol", "http")
+                if not name or not port:
+                    continue
+                url = f"{protocol}://{host}:{port}"
+                if name == "skvector" and url not in existing_skvector_urls:
+                    self._skvector.append(Endpoint(
+                        url=url,
+                        role="replica",
+                        tailscale_ip=tailscale_ip,
+                    ))
+                    existing_skvector_urls.add(url)
+                    logger.info("Discovered SKVector endpoint: %s", url)
+                elif name == "skgraph" and url not in existing_skgraph_urls:
+                    self._skgraph.append(Endpoint(
+                        url=url,
+                        role="replica",
+                        tailscale_ip=tailscale_ip,
+                    ))
+                    existing_skgraph_urls.add(url)
+                    logger.info("Discovered SKGraph endpoint: %s", url)
+    # -------------------------------------------------------------------
+    # Status reporting
+    # -------------------------------------------------------------------
+    def status(self) -> dict:
+        """Return a status report of all endpoints.
+        Returns:
+            Dict with strategy, endpoint lists, and probe staleness
+            (``last_probe_age_seconds`` is -1 when no probe has run yet).
+        """
+        now = time.monotonic()
+        stale_seconds = now - self._last_probe_time if self._last_probe_time > 0 else -1
+        return {
+            "strategy": self._config.strategy,
+            "probe_interval_seconds": self._config.probe_interval_seconds,
+            "last_probe_age_seconds": round(stale_seconds, 1),
+            "skvector_endpoints": [ep.model_dump() for ep in self._skvector],
+            "skgraph_endpoints": [ep.model_dump() for ep in self._skgraph],
+        }
+    @property
+    def skvector_endpoints(self) -> list[Endpoint]:
+        """Access the SKVector endpoint list (the live list, not a copy)."""
+        return self._skvector
+    @property
+    def skgraph_endpoints(self) -> list[Endpoint]:
+        """Access the SKGraph endpoint list (the live list, not a copy)."""
+        return self._skgraph
+    @property
+    def config(self) -> RoutingConfig:
+        """Access the routing configuration."""
+        return self._config