kailash 0.8.4__py3-none-any.whl → 0.8.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- kailash/__init__.py +5 -11
- kailash/channels/__init__.py +2 -1
- kailash/channels/mcp_channel.py +23 -4
- kailash/cli/__init__.py +11 -1
- kailash/cli/validate_imports.py +202 -0
- kailash/cli/validation_audit.py +570 -0
- kailash/core/actors/supervisor.py +1 -1
- kailash/core/resilience/bulkhead.py +15 -5
- kailash/core/resilience/circuit_breaker.py +74 -1
- kailash/core/resilience/health_monitor.py +433 -33
- kailash/edge/compliance.py +33 -0
- kailash/edge/consistency.py +609 -0
- kailash/edge/coordination/__init__.py +30 -0
- kailash/edge/coordination/global_ordering.py +355 -0
- kailash/edge/coordination/leader_election.py +217 -0
- kailash/edge/coordination/partition_detector.py +296 -0
- kailash/edge/coordination/raft.py +485 -0
- kailash/edge/discovery.py +63 -1
- kailash/edge/migration/__init__.py +19 -0
- kailash/edge/migration/edge_migration_service.py +384 -0
- kailash/edge/migration/edge_migrator.py +832 -0
- kailash/edge/monitoring/__init__.py +21 -0
- kailash/edge/monitoring/edge_monitor.py +736 -0
- kailash/edge/prediction/__init__.py +10 -0
- kailash/edge/prediction/predictive_warmer.py +591 -0
- kailash/edge/resource/__init__.py +102 -0
- kailash/edge/resource/cloud_integration.py +796 -0
- kailash/edge/resource/cost_optimizer.py +949 -0
- kailash/edge/resource/docker_integration.py +919 -0
- kailash/edge/resource/kubernetes_integration.py +893 -0
- kailash/edge/resource/platform_integration.py +913 -0
- kailash/edge/resource/predictive_scaler.py +959 -0
- kailash/edge/resource/resource_analyzer.py +824 -0
- kailash/edge/resource/resource_pools.py +610 -0
- kailash/integrations/dataflow_edge.py +261 -0
- kailash/mcp_server/registry_integration.py +1 -1
- kailash/mcp_server/server.py +351 -8
- kailash/mcp_server/transports.py +305 -0
- kailash/middleware/gateway/event_store.py +1 -0
- kailash/monitoring/__init__.py +18 -0
- kailash/monitoring/alerts.py +646 -0
- kailash/monitoring/metrics.py +677 -0
- kailash/nodes/__init__.py +2 -0
- kailash/nodes/ai/semantic_memory.py +2 -2
- kailash/nodes/base.py +622 -1
- kailash/nodes/code/python.py +44 -3
- kailash/nodes/data/async_sql.py +42 -20
- kailash/nodes/edge/__init__.py +36 -0
- kailash/nodes/edge/base.py +240 -0
- kailash/nodes/edge/cloud_node.py +710 -0
- kailash/nodes/edge/coordination.py +239 -0
- kailash/nodes/edge/docker_node.py +825 -0
- kailash/nodes/edge/edge_data.py +582 -0
- kailash/nodes/edge/edge_migration_node.py +396 -0
- kailash/nodes/edge/edge_monitoring_node.py +421 -0
- kailash/nodes/edge/edge_state.py +673 -0
- kailash/nodes/edge/edge_warming_node.py +393 -0
- kailash/nodes/edge/kubernetes_node.py +652 -0
- kailash/nodes/edge/platform_node.py +766 -0
- kailash/nodes/edge/resource_analyzer_node.py +378 -0
- kailash/nodes/edge/resource_optimizer_node.py +501 -0
- kailash/nodes/edge/resource_scaler_node.py +397 -0
- kailash/nodes/governance.py +410 -0
- kailash/nodes/ports.py +676 -0
- kailash/nodes/rag/registry.py +1 -1
- kailash/nodes/transaction/distributed_transaction_manager.py +48 -1
- kailash/nodes/transaction/saga_state_storage.py +2 -1
- kailash/nodes/validation.py +8 -8
- kailash/runtime/local.py +374 -1
- kailash/runtime/validation/__init__.py +12 -0
- kailash/runtime/validation/connection_context.py +119 -0
- kailash/runtime/validation/enhanced_error_formatter.py +202 -0
- kailash/runtime/validation/error_categorizer.py +164 -0
- kailash/runtime/validation/import_validator.py +446 -0
- kailash/runtime/validation/metrics.py +380 -0
- kailash/runtime/validation/performance.py +615 -0
- kailash/runtime/validation/suggestion_engine.py +212 -0
- kailash/testing/fixtures.py +2 -2
- kailash/utils/data_paths.py +74 -0
- kailash/workflow/builder.py +413 -8
- kailash/workflow/contracts.py +418 -0
- kailash/workflow/edge_infrastructure.py +369 -0
- kailash/workflow/mermaid_visualizer.py +3 -1
- kailash/workflow/migration.py +3 -3
- kailash/workflow/templates.py +6 -6
- kailash/workflow/type_inference.py +669 -0
- kailash/workflow/validation.py +134 -3
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/METADATA +52 -34
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/RECORD +93 -42
- kailash/nexus/__init__.py +0 -21
- kailash/nexus/cli/__init__.py +0 -5
- kailash/nexus/cli/__main__.py +0 -6
- kailash/nexus/cli/main.py +0 -176
- kailash/nexus/factory.py +0 -413
- kailash/nexus/gateway.py +0 -545
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/WHEEL +0 -0
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/entry_points.txt +0 -0
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/licenses/LICENSE +0 -0
- {kailash-0.8.4.dist-info → kailash-0.8.6.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,582 @@
|
|
1
|
+
"""Edge data node for distributed data management with consistency guarantees."""
|
2
|
+
|
3
|
+
import asyncio
|
4
|
+
import hashlib
|
5
|
+
import json
|
6
|
+
from datetime import UTC, datetime
|
7
|
+
from enum import Enum
|
8
|
+
from typing import Any, Dict, List, Optional, Set
|
9
|
+
|
10
|
+
from kailash.edge.location import EdgeLocation
|
11
|
+
from kailash.nodes.base import NodeParameter, register_node
|
12
|
+
|
13
|
+
from .base import EdgeNode
|
14
|
+
|
15
|
+
|
16
|
+
class ConsistencyModel(Enum):
    """Consistency guarantees a caller may request for edge data operations."""

    # Two-phase commit: every replica must acknowledge before the write succeeds.
    STRONG = "strong"
    # Fire-and-forget asynchronous replication; replicas converge over time.
    EVENTUAL = "eventual"
    # Updates are propagated with causal-dependency metadata attached.
    CAUSAL = "causal"
    # Reads tolerate lag, but never beyond a configured staleness window.
    BOUNDED_STALENESS = "bounded_staleness"
|
23
|
+
|
24
|
+
|
25
|
+
class ReplicationStatus:
|
26
|
+
"""Track replication status across edges."""
|
27
|
+
|
28
|
+
def __init__(self):
|
29
|
+
self.pending: Set[str] = set()
|
30
|
+
self.completed: Set[str] = set()
|
31
|
+
self.failed: Set[str] = set()
|
32
|
+
self.start_time = datetime.now(UTC)
|
33
|
+
|
34
|
+
@property
|
35
|
+
def is_complete(self) -> bool:
|
36
|
+
return len(self.pending) == 0
|
37
|
+
|
38
|
+
@property
|
39
|
+
def success_rate(self) -> float:
|
40
|
+
total = len(self.completed) + len(self.failed)
|
41
|
+
return len(self.completed) / total if total > 0 else 0.0
|
42
|
+
|
43
|
+
|
44
|
+
@register_node()
class EdgeDataNode(EdgeNode):
    """Distributed data node with multi-edge replication and consistency.

    Features:
    - Multiple consistency models
    - Automatic replication across edges
    - Conflict resolution
    - Compliance-aware data placement
    """

    def get_parameters(self) -> Dict[str, NodeParameter]:
        """Get node parameters.

        Declarative schema consumed by the node framework. Every parameter
        is optional; defaults favor a low-cost eventual-consistency read.
        """
        return {
            # Which operation async_run dispatches to.
            "action": NodeParameter(
                name="action",
                type=str,
                default="read",
                required=False,
                description="Operation to perform (read|write|replicate|sync)",
            ),
            "key": NodeParameter(
                name="key",
                type=str,
                required=False,
                description="Data key for operations",
            ),
            "data": NodeParameter(
                name="data", type=dict, required=False, description="Data to write"
            ),
            # Used only by the explicit "replicate" action.
            "target_edges": NodeParameter(
                name="target_edges",
                type=list,
                required=False,
                description="Target edges for replication",
            ),
            # Used only by the "sync" action.
            "keys": NodeParameter(
                name="keys", type=list, required=False, description="Keys to sync"
            ),
            # Must match a ConsistencyModel enum value.
            "consistency": NodeParameter(
                name="consistency",
                type=str,
                default="eventual",
                required=False,
                description="Consistency model (strong|eventual|causal|bounded_staleness)",
            ),
            # Total replicas including the local edge.
            "replication_factor": NodeParameter(
                name="replication_factor",
                type=int,
                default=3,
                required=False,
                description="Number of edge replicas to maintain",
            ),
            # Only consulted for bounded_staleness reads.
            "staleness_threshold_ms": NodeParameter(
                name="staleness_threshold_ms",
                type=int,
                default=5000,
                required=False,
                description="Max staleness for bounded consistency (ms)",
            ),
            # NOTE(review): only last_write_wins is currently implemented
            # (see _resolve_conflict) — other values are accepted but ignored.
            "conflict_resolution": NodeParameter(
                name="conflict_resolution",
                type=str,
                default="last_write_wins",
                required=False,
                description="Conflict resolution strategy",
            ),
        }
|
112
|
+
|
113
|
+
    def __init__(self, **config):
        """Initialize edge data node."""
        super().__init__(**config)

        # Data storage per edge (simulated): edge name -> {key -> entry dict}.
        self._edge_data: Dict[str, Dict[str, Any]] = {}
        # Highest known version per key, tracked per edge name.
        self._data_versions: Dict[str, Dict[str, int]] = {}
        # In-flight background replication tasks, keyed "key:version".
        self._replication_tasks: Dict[str, asyncio.Task] = {}
|
121
|
+
|
122
|
+
async def async_run(self, **kwargs) -> Dict[str, Any]:
|
123
|
+
"""Execute edge data operation."""
|
124
|
+
# Get action from kwargs first, then from config
|
125
|
+
action = kwargs.get("action") or self.config.get("action", "read")
|
126
|
+
|
127
|
+
if action == "write":
|
128
|
+
return await self._handle_write(kwargs)
|
129
|
+
elif action == "read":
|
130
|
+
return await self._handle_read(kwargs)
|
131
|
+
elif action == "replicate":
|
132
|
+
return await self._handle_replicate(kwargs)
|
133
|
+
elif action == "sync":
|
134
|
+
return await self._handle_sync(kwargs)
|
135
|
+
else:
|
136
|
+
raise ValueError(f"Unknown action: {action}")
|
137
|
+
|
138
|
+
async def _handle_write(self, params: Dict[str, Any]) -> Dict[str, Any]:
|
139
|
+
"""Handle write operation with consistency guarantees."""
|
140
|
+
key = params.get("key")
|
141
|
+
data = params.get("data")
|
142
|
+
consistency = ConsistencyModel(params.get("consistency", "eventual"))
|
143
|
+
|
144
|
+
if not key or data is None:
|
145
|
+
raise ValueError("Write requires 'key' and 'data'")
|
146
|
+
|
147
|
+
# Ensure compliance for data placement
|
148
|
+
if not await self.ensure_compliance({"data": data}):
|
149
|
+
return {"success": False, "error": "No compliant edge available for data"}
|
150
|
+
|
151
|
+
# Generate version
|
152
|
+
version = self._get_next_version(key)
|
153
|
+
|
154
|
+
# Store locally first
|
155
|
+
edge_name = self.current_edge.name
|
156
|
+
if edge_name not in self._edge_data:
|
157
|
+
self._edge_data[edge_name] = {}
|
158
|
+
self._data_versions[edge_name] = {}
|
159
|
+
|
160
|
+
self._edge_data[edge_name][key] = {
|
161
|
+
"data": data,
|
162
|
+
"version": version,
|
163
|
+
"timestamp": datetime.now(UTC).isoformat(),
|
164
|
+
"edge": edge_name,
|
165
|
+
}
|
166
|
+
self._data_versions[edge_name][key] = version
|
167
|
+
|
168
|
+
# Handle consistency model
|
169
|
+
replication_status = ReplicationStatus()
|
170
|
+
|
171
|
+
if consistency == ConsistencyModel.STRONG:
|
172
|
+
# Synchronous replication to all replicas
|
173
|
+
await self._replicate_strong(key, data, version, replication_status)
|
174
|
+
else:
|
175
|
+
# Async replication for other models
|
176
|
+
task = asyncio.create_task(
|
177
|
+
self._replicate_async(
|
178
|
+
key, data, version, consistency, replication_status
|
179
|
+
)
|
180
|
+
)
|
181
|
+
self._replication_tasks[f"{key}:{version}"] = task
|
182
|
+
|
183
|
+
return {
|
184
|
+
"success": True,
|
185
|
+
"key": key,
|
186
|
+
"version": version,
|
187
|
+
"edge": edge_name,
|
188
|
+
"consistency": consistency.value,
|
189
|
+
"replication_status": {
|
190
|
+
"pending": len(replication_status.pending),
|
191
|
+
"completed": len(replication_status.completed),
|
192
|
+
"failed": len(replication_status.failed),
|
193
|
+
},
|
194
|
+
}
|
195
|
+
|
196
|
+
async def _handle_read(self, params: Dict[str, Any]) -> Dict[str, Any]:
|
197
|
+
"""Handle read operation with consistency awareness."""
|
198
|
+
key = params.get("key")
|
199
|
+
consistency = ConsistencyModel(params.get("consistency", "eventual"))
|
200
|
+
|
201
|
+
if not key:
|
202
|
+
raise ValueError("Read requires 'key'")
|
203
|
+
|
204
|
+
# For strong consistency, ensure we have latest version
|
205
|
+
if consistency == ConsistencyModel.STRONG:
|
206
|
+
await self._ensure_latest_version(key)
|
207
|
+
|
208
|
+
# Find edge with data
|
209
|
+
edge_with_data = await self._find_edge_with_data(key)
|
210
|
+
if not edge_with_data:
|
211
|
+
return {"success": False, "error": f"Key '{key}' not found"}
|
212
|
+
|
213
|
+
# Get data from edge
|
214
|
+
edge_name, data_entry = edge_with_data
|
215
|
+
|
216
|
+
# Check staleness for bounded consistency
|
217
|
+
if consistency == ConsistencyModel.BOUNDED_STALENESS:
|
218
|
+
staleness_ms = self._calculate_staleness(data_entry)
|
219
|
+
threshold = params.get("staleness_threshold_ms", 5000)
|
220
|
+
|
221
|
+
if staleness_ms > threshold:
|
222
|
+
# Try to get fresher data
|
223
|
+
await self._refresh_from_primary(key)
|
224
|
+
edge_with_data = await self._find_edge_with_data(key)
|
225
|
+
if edge_with_data:
|
226
|
+
edge_name, data_entry = edge_with_data
|
227
|
+
|
228
|
+
return {
|
229
|
+
"success": True,
|
230
|
+
"key": key,
|
231
|
+
"data": data_entry["data"],
|
232
|
+
"version": data_entry["version"],
|
233
|
+
"timestamp": data_entry["timestamp"],
|
234
|
+
"edge": edge_name,
|
235
|
+
"latency_ms": self._get_edge_latency(edge_name),
|
236
|
+
}
|
237
|
+
|
238
|
+
async def _handle_replicate(self, params: Dict[str, Any]) -> Dict[str, Any]:
|
239
|
+
"""Handle manual replication request."""
|
240
|
+
key = params.get("key")
|
241
|
+
target_edges = params.get("target_edges", [])
|
242
|
+
|
243
|
+
if not key:
|
244
|
+
raise ValueError("Replicate requires 'key'")
|
245
|
+
|
246
|
+
# Find source data
|
247
|
+
edge_with_data = await self._find_edge_with_data(key)
|
248
|
+
if not edge_with_data:
|
249
|
+
return {"success": False, "error": f"Key '{key}' not found"}
|
250
|
+
|
251
|
+
source_edge, data_entry = edge_with_data
|
252
|
+
|
253
|
+
# Replicate to targets
|
254
|
+
replication_results = {}
|
255
|
+
for target in target_edges:
|
256
|
+
success = await self._replicate_to_edge(
|
257
|
+
target, key, data_entry["data"], data_entry["version"]
|
258
|
+
)
|
259
|
+
replication_results[target] = success
|
260
|
+
|
261
|
+
return {
|
262
|
+
"success": True,
|
263
|
+
"key": key,
|
264
|
+
"source_edge": source_edge,
|
265
|
+
"replication_results": replication_results,
|
266
|
+
}
|
267
|
+
|
268
|
+
async def _handle_sync(self, params: Dict[str, Any]) -> Dict[str, Any]:
|
269
|
+
"""Handle sync operation to ensure consistency."""
|
270
|
+
keys = params.get("keys", [])
|
271
|
+
|
272
|
+
sync_results = {}
|
273
|
+
for key in keys:
|
274
|
+
# Find all versions across edges
|
275
|
+
versions = self._get_all_versions(key)
|
276
|
+
|
277
|
+
if not versions:
|
278
|
+
sync_results[key] = {"status": "not_found"}
|
279
|
+
continue
|
280
|
+
|
281
|
+
# Determine winning version
|
282
|
+
winner_edge, winner_version = self._resolve_conflict(versions)
|
283
|
+
|
284
|
+
# Sync winning version to all edges with the key
|
285
|
+
edges_to_sync = [e for e, v in versions.items() if v < winner_version]
|
286
|
+
|
287
|
+
if edges_to_sync:
|
288
|
+
data_entry = self._edge_data.get(winner_edge, {}).get(key)
|
289
|
+
if data_entry:
|
290
|
+
for edge in edges_to_sync:
|
291
|
+
await self._replicate_to_edge(
|
292
|
+
edge, key, data_entry["data"], winner_version
|
293
|
+
)
|
294
|
+
|
295
|
+
sync_results[key] = {
|
296
|
+
"status": "synced",
|
297
|
+
"winner_edge": winner_edge,
|
298
|
+
"winner_version": winner_version,
|
299
|
+
"synced_edges": edges_to_sync,
|
300
|
+
}
|
301
|
+
|
302
|
+
return {"success": True, "sync_results": sync_results}
|
303
|
+
|
304
|
+
async def _replicate_strong(
|
305
|
+
self, key: str, data: Any, version: int, status: ReplicationStatus
|
306
|
+
):
|
307
|
+
"""Perform strong consistency replication (2PC)."""
|
308
|
+
# Get target edges
|
309
|
+
target_edges = await self._select_replication_targets()
|
310
|
+
|
311
|
+
# Phase 1: Prepare
|
312
|
+
prepare_tasks = []
|
313
|
+
for edge in target_edges:
|
314
|
+
status.pending.add(edge.name)
|
315
|
+
prepare_tasks.append(self._prepare_replication(edge, key, data, version))
|
316
|
+
|
317
|
+
prepare_results = await asyncio.gather(*prepare_tasks, return_exceptions=True)
|
318
|
+
|
319
|
+
# Check if all prepared successfully
|
320
|
+
prepared_edges = []
|
321
|
+
for edge, result in zip(target_edges, prepare_results):
|
322
|
+
if isinstance(result, Exception) or not result:
|
323
|
+
status.failed.add(edge.name)
|
324
|
+
status.pending.discard(edge.name)
|
325
|
+
else:
|
326
|
+
prepared_edges.append(edge)
|
327
|
+
|
328
|
+
# Phase 2: Commit or Abort
|
329
|
+
if len(prepared_edges) == len(target_edges):
|
330
|
+
# All prepared - commit
|
331
|
+
commit_tasks = []
|
332
|
+
for edge in prepared_edges:
|
333
|
+
commit_tasks.append(self._commit_replication(edge, key, version))
|
334
|
+
|
335
|
+
await asyncio.gather(*commit_tasks, return_exceptions=True)
|
336
|
+
|
337
|
+
for edge in prepared_edges:
|
338
|
+
status.completed.add(edge.name)
|
339
|
+
status.pending.discard(edge.name)
|
340
|
+
else:
|
341
|
+
# Some failed - abort
|
342
|
+
abort_tasks = []
|
343
|
+
for edge in prepared_edges:
|
344
|
+
abort_tasks.append(self._abort_replication(edge, key, version))
|
345
|
+
|
346
|
+
await asyncio.gather(*abort_tasks, return_exceptions=True)
|
347
|
+
|
348
|
+
raise RuntimeError(
|
349
|
+
f"Strong consistency replication failed. "
|
350
|
+
f"Only {len(prepared_edges)}/{len(target_edges)} edges prepared."
|
351
|
+
)
|
352
|
+
|
353
|
+
async def _replicate_async(
|
354
|
+
self,
|
355
|
+
key: str,
|
356
|
+
data: Any,
|
357
|
+
version: int,
|
358
|
+
consistency: ConsistencyModel,
|
359
|
+
status: ReplicationStatus,
|
360
|
+
):
|
361
|
+
"""Perform async replication for eventual/causal/bounded consistency."""
|
362
|
+
target_edges = await self._select_replication_targets()
|
363
|
+
|
364
|
+
tasks = []
|
365
|
+
for edge in target_edges:
|
366
|
+
status.pending.add(edge.name)
|
367
|
+
|
368
|
+
if consistency == ConsistencyModel.CAUSAL:
|
369
|
+
# Add causal dependency tracking
|
370
|
+
task = self._replicate_causal(edge, key, data, version)
|
371
|
+
else:
|
372
|
+
# Simple async replication
|
373
|
+
task = self._replicate_to_edge(edge.name, key, data, version)
|
374
|
+
|
375
|
+
tasks.append(task)
|
376
|
+
|
377
|
+
results = await asyncio.gather(*tasks, return_exceptions=True)
|
378
|
+
|
379
|
+
for edge, result in zip(target_edges, results):
|
380
|
+
if isinstance(result, Exception) or not result:
|
381
|
+
status.failed.add(edge.name)
|
382
|
+
else:
|
383
|
+
status.completed.add(edge.name)
|
384
|
+
status.pending.discard(edge.name)
|
385
|
+
|
386
|
+
async def _select_replication_targets(self) -> List[EdgeLocation]:
|
387
|
+
"""Select edges for replication based on strategy."""
|
388
|
+
all_edges = self.edge_discovery.get_all_edges()
|
389
|
+
|
390
|
+
# Remove current edge
|
391
|
+
target_edges = [e for e in all_edges if e.name != self.current_edge.name]
|
392
|
+
|
393
|
+
# Filter by compliance if needed
|
394
|
+
if self.compliance_zones:
|
395
|
+
target_edges = [
|
396
|
+
e
|
397
|
+
for e in target_edges
|
398
|
+
if any(zone in e.compliance_zones for zone in self.compliance_zones)
|
399
|
+
]
|
400
|
+
|
401
|
+
# Sort by strategy and take replication_factor - 1 (current edge is 1)
|
402
|
+
target_edges = sorted(
|
403
|
+
target_edges,
|
404
|
+
key=lambda e: (e.metrics.latency_p50_ms, e.metrics.network_cost_per_gb),
|
405
|
+
)
|
406
|
+
|
407
|
+
return target_edges[: self.config.get("replication_factor", 3) - 1]
|
408
|
+
|
409
|
+
async def _replicate_to_edge(
|
410
|
+
self, edge_name: str, key: str, data: Any, version: int
|
411
|
+
) -> bool:
|
412
|
+
"""Replicate data to specific edge."""
|
413
|
+
try:
|
414
|
+
# Simulate network replication
|
415
|
+
await asyncio.sleep(0.05) # 50ms replication latency
|
416
|
+
|
417
|
+
# Store in edge data
|
418
|
+
if edge_name not in self._edge_data:
|
419
|
+
self._edge_data[edge_name] = {}
|
420
|
+
self._data_versions[edge_name] = {}
|
421
|
+
|
422
|
+
self._edge_data[edge_name][key] = {
|
423
|
+
"data": data,
|
424
|
+
"version": version,
|
425
|
+
"timestamp": datetime.now(UTC).isoformat(),
|
426
|
+
"edge": edge_name,
|
427
|
+
}
|
428
|
+
self._data_versions[edge_name][key] = version
|
429
|
+
|
430
|
+
return True
|
431
|
+
|
432
|
+
except Exception as e:
|
433
|
+
self.logger.error(f"Replication to {edge_name} failed: {e}")
|
434
|
+
return False
|
435
|
+
|
436
|
+
async def _prepare_replication(
|
437
|
+
self, edge: EdgeLocation, key: str, data: Any, version: int
|
438
|
+
) -> bool:
|
439
|
+
"""Prepare phase of 2PC replication."""
|
440
|
+
# Simulate prepare phase
|
441
|
+
await asyncio.sleep(0.02)
|
442
|
+
|
443
|
+
# Check if edge can accept the write
|
444
|
+
if edge.metrics.storage_utilization > 0.95: # 95% full
|
445
|
+
return False
|
446
|
+
|
447
|
+
return True
|
448
|
+
|
449
|
+
async def _commit_replication(
|
450
|
+
self, edge: EdgeLocation, key: str, version: int
|
451
|
+
) -> bool:
|
452
|
+
"""Commit phase of 2PC replication."""
|
453
|
+
# Actually replicate the data
|
454
|
+
data_entry = self._edge_data.get(self.current_edge.name, {}).get(key)
|
455
|
+
if data_entry:
|
456
|
+
return await self._replicate_to_edge(
|
457
|
+
edge.name, key, data_entry["data"], version
|
458
|
+
)
|
459
|
+
return False
|
460
|
+
|
461
|
+
async def _abort_replication(
|
462
|
+
self, edge: EdgeLocation, key: str, version: int
|
463
|
+
) -> bool:
|
464
|
+
"""Abort phase of 2PC replication."""
|
465
|
+
# Clean up any prepared state
|
466
|
+
await asyncio.sleep(0.01)
|
467
|
+
return True
|
468
|
+
|
469
|
+
async def _replicate_causal(
|
470
|
+
self, edge: EdgeLocation, key: str, data: Any, version: int
|
471
|
+
) -> bool:
|
472
|
+
"""Replicate with causal consistency tracking."""
|
473
|
+
# Add causal dependency metadata
|
474
|
+
causal_data = {
|
475
|
+
"data": data,
|
476
|
+
"version": version,
|
477
|
+
"causal_deps": self._get_causal_dependencies(key),
|
478
|
+
"timestamp": datetime.now(UTC).isoformat(),
|
479
|
+
}
|
480
|
+
|
481
|
+
return await self._replicate_to_edge(edge.name, key, causal_data, version)
|
482
|
+
|
483
|
+
def _get_next_version(self, key: str) -> int:
|
484
|
+
"""Get next version number for a key."""
|
485
|
+
max_version = 0
|
486
|
+
|
487
|
+
for edge_versions in self._data_versions.values():
|
488
|
+
if key in edge_versions:
|
489
|
+
max_version = max(max_version, edge_versions[key])
|
490
|
+
|
491
|
+
return max_version + 1
|
492
|
+
|
493
|
+
async def _find_edge_with_data(
|
494
|
+
self, key: str
|
495
|
+
) -> Optional[tuple[str, Dict[str, Any]]]:
|
496
|
+
"""Find edge that has the requested data."""
|
497
|
+
# First check current edge
|
498
|
+
if self.current_edge:
|
499
|
+
edge_name = self.current_edge.name
|
500
|
+
if edge_name in self._edge_data and key in self._edge_data[edge_name]:
|
501
|
+
return (edge_name, self._edge_data[edge_name][key])
|
502
|
+
|
503
|
+
# Check other edges by latency
|
504
|
+
edges_by_latency = sorted(
|
505
|
+
self.edge_discovery.get_all_edges(), key=lambda e: e.metrics.latency_p50_ms
|
506
|
+
)
|
507
|
+
|
508
|
+
for edge in edges_by_latency:
|
509
|
+
if edge.name in self._edge_data and key in self._edge_data[edge.name]:
|
510
|
+
return (edge.name, self._edge_data[edge.name][key])
|
511
|
+
|
512
|
+
return None
|
513
|
+
|
514
|
+
def _calculate_staleness(self, data_entry: Dict[str, Any]) -> float:
|
515
|
+
"""Calculate data staleness in milliseconds."""
|
516
|
+
timestamp_str = data_entry["timestamp"]
|
517
|
+
# Handle both timezone-aware and naive timestamps
|
518
|
+
if timestamp_str.endswith("Z"):
|
519
|
+
timestamp_str = timestamp_str[:-1] + "+00:00"
|
520
|
+
timestamp = datetime.fromisoformat(timestamp_str)
|
521
|
+
|
522
|
+
# Make sure timestamp is timezone-aware
|
523
|
+
if timestamp.tzinfo is None:
|
524
|
+
timestamp = timestamp.replace(tzinfo=UTC)
|
525
|
+
|
526
|
+
staleness = datetime.now(UTC) - timestamp
|
527
|
+
return staleness.total_seconds() * 1000
|
528
|
+
|
529
|
+
def _get_edge_latency(self, edge_name: str) -> float:
|
530
|
+
"""Get latency to specific edge."""
|
531
|
+
edge = self.edge_discovery.get_edge(edge_name)
|
532
|
+
return edge.metrics.latency_p50_ms if edge else 0.0
|
533
|
+
|
534
|
+
def _get_all_versions(self, key: str) -> Dict[str, int]:
|
535
|
+
"""Get all versions of a key across edges."""
|
536
|
+
versions = {}
|
537
|
+
|
538
|
+
for edge_name, edge_versions in self._data_versions.items():
|
539
|
+
if key in edge_versions:
|
540
|
+
versions[edge_name] = edge_versions[key]
|
541
|
+
|
542
|
+
return versions
|
543
|
+
|
544
|
+
def _resolve_conflict(self, versions: Dict[str, int]) -> tuple[str, int]:
|
545
|
+
"""Resolve version conflict using configured strategy."""
|
546
|
+
# For now, last write wins (highest version)
|
547
|
+
if not versions:
|
548
|
+
return (None, 0)
|
549
|
+
|
550
|
+
winner_edge = max(versions.items(), key=lambda x: x[1])
|
551
|
+
return winner_edge
|
552
|
+
|
553
|
+
async def _ensure_latest_version(self, key: str):
|
554
|
+
"""Ensure we have the latest version for strong consistency."""
|
555
|
+
# In production, this would check with other edges
|
556
|
+
await asyncio.sleep(0.01) # Simulate version check
|
557
|
+
|
558
|
+
async def _refresh_from_primary(self, key: str):
|
559
|
+
"""Refresh data from primary edge for bounded staleness."""
|
560
|
+
# In production, this would fetch from primary
|
561
|
+
await asyncio.sleep(0.02) # Simulate refresh
|
562
|
+
|
563
|
+
def _get_causal_dependencies(self, key: str) -> List[str]:
|
564
|
+
"""Get causal dependencies for a key."""
|
565
|
+
# In production, track actual dependencies
|
566
|
+
return []
|
567
|
+
|
568
|
+
async def cleanup(self):
|
569
|
+
"""Cleanup resources including replication tasks."""
|
570
|
+
# Cancel all replication tasks
|
571
|
+
tasks_to_cancel = []
|
572
|
+
for task_id, task in self._replication_tasks.items():
|
573
|
+
if not task.done():
|
574
|
+
task.cancel()
|
575
|
+
tasks_to_cancel.append(task)
|
576
|
+
|
577
|
+
# Wait for all cancelled tasks to complete
|
578
|
+
if tasks_to_cancel:
|
579
|
+
await asyncio.gather(*tasks_to_cancel, return_exceptions=True)
|
580
|
+
|
581
|
+
# Clear the task registry
|
582
|
+
self._replication_tasks.clear()
|