mcp-mesh 0.7.12__py3-none-any.whl → 0.7.14__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- _mcp_mesh/__init__.py +1 -1
- _mcp_mesh/engine/__init__.py +1 -22
- _mcp_mesh/engine/async_mcp_client.py +88 -25
- _mcp_mesh/engine/decorator_registry.py +10 -9
- _mcp_mesh/engine/dependency_injector.py +64 -53
- _mcp_mesh/engine/mesh_llm_agent.py +119 -5
- _mcp_mesh/engine/mesh_llm_agent_injector.py +30 -0
- _mcp_mesh/engine/session_aware_client.py +3 -3
- _mcp_mesh/engine/unified_mcp_proxy.py +82 -90
- _mcp_mesh/pipeline/api_heartbeat/api_dependency_resolution.py +0 -89
- _mcp_mesh/pipeline/api_heartbeat/api_fast_heartbeat_check.py +3 -3
- _mcp_mesh/pipeline/api_heartbeat/api_heartbeat_pipeline.py +30 -28
- _mcp_mesh/pipeline/mcp_heartbeat/dependency_resolution.py +16 -18
- _mcp_mesh/pipeline/mcp_heartbeat/fast_heartbeat_check.py +5 -5
- _mcp_mesh/pipeline/mcp_heartbeat/heartbeat_orchestrator.py +3 -3
- _mcp_mesh/pipeline/mcp_heartbeat/heartbeat_pipeline.py +6 -6
- _mcp_mesh/pipeline/mcp_heartbeat/heartbeat_send.py +1 -1
- _mcp_mesh/pipeline/mcp_heartbeat/llm_tools_resolution.py +15 -11
- _mcp_mesh/pipeline/mcp_heartbeat/registry_connection.py +3 -3
- _mcp_mesh/pipeline/mcp_startup/fastapiserver_setup.py +37 -268
- _mcp_mesh/pipeline/mcp_startup/lifespan_factory.py +142 -0
- _mcp_mesh/pipeline/mcp_startup/startup_orchestrator.py +57 -93
- _mcp_mesh/pipeline/shared/registry_connection.py +1 -1
- _mcp_mesh/shared/health_check_manager.py +313 -0
- _mcp_mesh/shared/logging_config.py +190 -7
- _mcp_mesh/shared/registry_client_wrapper.py +8 -8
- _mcp_mesh/shared/sse_parser.py +19 -17
- _mcp_mesh/tracing/execution_tracer.py +26 -1
- _mcp_mesh/tracing/fastapi_tracing_middleware.py +3 -4
- _mcp_mesh/tracing/trace_context_helper.py +25 -6
- {mcp_mesh-0.7.12.dist-info → mcp_mesh-0.7.14.dist-info}/METADATA +1 -1
- {mcp_mesh-0.7.12.dist-info → mcp_mesh-0.7.14.dist-info}/RECORD +38 -39
- mesh/__init__.py +3 -1
- mesh/decorators.py +81 -43
- mesh/helpers.py +72 -4
- mesh/types.py +48 -4
- _mcp_mesh/engine/full_mcp_proxy.py +0 -641
- _mcp_mesh/engine/mcp_client_proxy.py +0 -457
- _mcp_mesh/shared/health_check_cache.py +0 -246
- {mcp_mesh-0.7.12.dist-info → mcp_mesh-0.7.14.dist-info}/WHEEL +0 -0
- {mcp_mesh-0.7.12.dist-info → mcp_mesh-0.7.14.dist-info}/licenses/LICENSE +0 -0
@@ -120,11 +120,15 @@ class DebounceCoordinator:
 
     def _execute_processing(self) -> None:
         """Execute the processing (called by timer)."""
-
+        # Copy orchestrator reference under lock to prevent race with cleanup()
+        with self._lock:
+            orchestrator = self._orchestrator
 
-
-
-
+        if orchestrator is None:
+            self.logger.error("❌ No orchestrator set for processing")
+            return
+
+        try:
 
             self.logger.info(
                 f"🚀 Debounce delay ({self.delay_seconds}s) complete, processing all decorators"
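The guard added here is the standard copy-under-lock fix for a check-then-use race: `cleanup()` on another thread can null out `self._orchestrator`, so the timer callback snapshots the reference while holding the lock and works only with the local copy afterwards. A minimal sketch of the pattern, with hypothetical `Coordinator` and `process()` names standing in for the real classes:

import threading


class Coordinator:
    """Hypothetical stand-in for DebounceCoordinator."""

    def __init__(self, orchestrator) -> None:
        self._lock = threading.Lock()
        self._orchestrator = orchestrator  # may be cleared by cleanup()

    def cleanup(self) -> None:
        # Called from another thread during shutdown.
        with self._lock:
            self._orchestrator = None

    def _execute_processing(self) -> None:
        # Snapshot the reference under the lock; a concurrent cleanup()
        # can no longer swap it to None between the check and the use.
        with self._lock:
            orchestrator = self._orchestrator
        if orchestrator is None:
            return  # lost the race with cleanup(); nothing to do
        orchestrator.process()  # the local reference stays valid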
@@ -160,10 +164,10 @@ class DebounceCoordinator:
         # Execute appropriate pipeline based on type
         if pipeline_type == "mcp":
             # Phase 1: Run async MCP pipeline setup
-            result = asyncio.run(
+            result = asyncio.run(orchestrator.process_once())
         elif pipeline_type == "api":
             # Phase 1: Run async API pipeline setup
-            result = asyncio.run(
+            result = asyncio.run(orchestrator.process_api_once())
         else:
             raise RuntimeError(f"Unsupported pipeline type: {pipeline_type}")
 
@@ -177,8 +181,16 @@ class DebounceCoordinator:
             # For API services, ONLY do dependency injection - user controls their FastAPI server
             # Dependency injection is already complete from pipeline execution
             # Optionally start heartbeat in background (non-blocking)
-
-
+            from ..api_heartbeat.api_lifespan_integration import (
+                api_heartbeat_lifespan_task,
+            )
+
+            self._setup_heartbeat_background(
+                heartbeat_config,
+                pipeline_context,
+                api_heartbeat_lifespan_task,
+                id_field="service_id",
+                label="API service",
             )
             self.logger.info(
                 "✅ API dependency injection complete - user's FastAPI server can now start"
@@ -186,8 +198,14 @@ class DebounceCoordinator:
             return  # Don't block - let user's uvicorn run
         elif fastapi_app and binding_config:
             # For MCP agents - use same daemon thread pattern as API apps
-
-
+            from ..mcp_heartbeat.lifespan_integration import (
+                heartbeat_lifespan_task,
+            )
+
+            self._setup_heartbeat_background(
+                heartbeat_config,
+                pipeline_context,
+                heartbeat_lifespan_task,
             )
 
             # Check if server was already reused from immediate uvicorn start
@@ -268,9 +286,9 @@ class DebounceCoordinator:
         self.logger.info("🏁 Auto-run disabled - single execution mode")
 
         if pipeline_type == "mcp":
-            result = asyncio.run(
+            result = asyncio.run(orchestrator.process_once())
         elif pipeline_type == "api":
-            result = asyncio.run(
+            result = asyncio.run(orchestrator.process_api_once())
         else:
             raise RuntimeError(f"Unsupported pipeline type: {pipeline_type}")
 
@@ -311,119 +329,65 @@ class DebounceCoordinator:
             self.logger.error(f"❌ FastAPI server error: {e}")
             raise
 
-    def
-        self,
+    def _setup_heartbeat_background(
+        self,
+        heartbeat_config: dict[str, Any],
+        pipeline_context: dict[str, Any],
+        heartbeat_task_fn: Any,
+        id_field: str = "agent_id",
+        label: str = "MCP agent",
     ) -> None:
-        """
-
-        # Populate heartbeat context with current pipeline context
-        heartbeat_config["context"] = pipeline_context
-        service_id = heartbeat_config.get("service_id", "unknown")
-        standalone_mode = heartbeat_config.get("standalone_mode", False)
-
-        if standalone_mode:
-            self.logger.info(
-                f"📝 API service '{service_id}' configured in standalone mode - no heartbeat"
-            )
-            return
-
-        self.logger.info(
-            f"🔗 Setting up background API heartbeat for service '{service_id}'"
-        )
-
-        # Import heartbeat functionality
-        import asyncio
-        import threading
-
-        from ..api_heartbeat.api_lifespan_integration import (
-            api_heartbeat_lifespan_task,
-        )
-
-        def run_heartbeat():
-            """Run heartbeat in separate thread with its own event loop."""
-            self.logger.debug(
-                f"Starting background heartbeat thread for {service_id}"
-            )
-            try:
-                # Create new event loop for this thread
-                loop = asyncio.new_event_loop()
-                asyncio.set_event_loop(loop)
-
-                # Run heartbeat task
-                loop.run_until_complete(
-                    api_heartbeat_lifespan_task(heartbeat_config)
-                )
-            except Exception as e:
-                self.logger.error(f"❌ Background heartbeat error: {e}")
-            finally:
-                loop.close()
-
-        # Start heartbeat in daemon thread (won't prevent process exit)
-        heartbeat_thread = threading.Thread(target=run_heartbeat, daemon=True)
-        heartbeat_thread.start()
+        """
+        Setup heartbeat to run in background thread.
 
-
-            f"💓 Background API heartbeat thread started for service '{service_id}'"
-        )
+        Unified implementation for both API services and MCP agents.
 
-
-
-
+        Args:
+            heartbeat_config: Heartbeat configuration dict
+            pipeline_context: Pipeline context to populate into config
+            heartbeat_task_fn: Async function to run (api or mcp heartbeat task)
+            id_field: Config key for ID ("agent_id" or "service_id")
+            label: Label for log messages ("MCP agent" or "API service")
+        """
+        import asyncio
+        import threading
 
-    def _setup_mcp_heartbeat_background(
-        self, heartbeat_config: dict[str, Any], pipeline_context: dict[str, Any]
-    ) -> None:
-        """Setup MCP heartbeat to run in background - same pattern as API apps."""
         try:
-            # Populate heartbeat context with current pipeline context
             heartbeat_config["context"] = pipeline_context
-
+            entity_id = heartbeat_config.get(id_field, "unknown")
             standalone_mode = heartbeat_config.get("standalone_mode", False)
 
             if standalone_mode:
                 self.logger.info(
-                    f"
+                    f"{label} '{entity_id}' configured in standalone mode - no heartbeat"
                 )
                 return
 
             self.logger.info(
-                f"
+                f"Setting up background heartbeat for {label} '{entity_id}'"
             )
 
-            # Import heartbeat functionality
-            import asyncio
-            import threading
-
-            from ..mcp_heartbeat.lifespan_integration import heartbeat_lifespan_task
-
            def run_heartbeat():
                """Run heartbeat in separate thread with its own event loop."""
-                self.logger.debug(
-                    f"Starting background heartbeat thread for {agent_id}"
-                )
+                self.logger.debug(f"Starting background heartbeat thread for {entity_id}")
                try:
-                    # Create new event loop for this thread
                    loop = asyncio.new_event_loop()
                    asyncio.set_event_loop(loop)
-
-                    # Run heartbeat task
-                    loop.run_until_complete(heartbeat_lifespan_task(heartbeat_config))
+                    loop.run_until_complete(heartbeat_task_fn(heartbeat_config))
                except Exception as e:
-                    self.logger.error(f"
+                    self.logger.error(f"Background heartbeat error: {e}")
                finally:
                    loop.close()
 
-            # Start heartbeat in daemon thread (won't prevent process exit)
            heartbeat_thread = threading.Thread(target=run_heartbeat, daemon=True)
            heartbeat_thread.start()
 
            self.logger.info(
-                f"
+                f"Background heartbeat thread started for {label} '{entity_id}'"
            )
 
        except Exception as e:
-            self.logger.warning(f"
-            # Don't fail - heartbeat is optional for MCP agents
+            self.logger.warning(f"Could not setup {label} heartbeat: {e}")
 
        # Graceful shutdown is now handled by FastAPI lifespan in simple_shutdown.py
 
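This hunk folds the duplicated `_setup_api_heartbeat_background` and `_setup_mcp_heartbeat_background` methods into one parameterized helper while keeping the same execution model: the async heartbeat runs on a private event loop inside a daemon thread, so it neither blocks the caller nor keeps the process alive at exit. A runnable sketch of that model; `heartbeat_task` here is a stand-in for the real lifespan tasks, not mcp-mesh code:

import asyncio
import threading


async def heartbeat_task(config: dict) -> None:
    # Stand-in for api_heartbeat_lifespan_task / heartbeat_lifespan_task.
    while True:
        await asyncio.sleep(config.get("interval", 30))
        # ... send a heartbeat to the registry here ...


def start_background_heartbeat(config: dict) -> threading.Thread:
    def run() -> None:
        # A new thread has no event loop, so create a private one; it
        # never competes with the user's main-thread loop.
        loop = asyncio.new_event_loop()
        asyncio.set_event_loop(loop)
        try:
            loop.run_until_complete(heartbeat_task(config))
        finally:
            loop.close()

    # daemon=True: the thread will not prevent process exit.
    thread = threading.Thread(target=run, daemon=True)
    thread.start()
    return thread

Calling asyncio.run() inside the thread would achieve the same loop lifecycle in one call; the explicit new_event_loop/close pair mirrors what the diff keeps.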
@@ -65,7 +65,7 @@ class RegistryConnectionStep(PipelineStep):
             result.add_context("registry_wrapper", registry_wrapper)
 
             result.message = f"Connected to registry at {registry_url}"
-            self.logger.
+            self.logger.trace(f"🔗 Registry connection established: {registry_url}")
 
         except Exception as e:
             result.status = PipelineStatus.FAILED
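Note that `self.logger.trace(...)` is not a standard `logging` method; a TRACE level is presumably installed by the package's own logging setup (logging_config.py grows by roughly 190 lines in this release). A generic sketch of how such a level is commonly registered, offered as an assumption rather than mcp-mesh's actual implementation:

import logging

TRACE = 5  # below DEBUG (10); the value mcp-mesh uses is an assumption


def install_trace_level() -> None:
    """Register a TRACE level plus a Logger.trace() convenience method."""
    logging.addLevelName(TRACE, "TRACE")

    def trace(self, message, *args, **kwargs):
        if self.isEnabledFor(TRACE):
            self._log(TRACE, message, args, **kwargs)

    # Monkey-patch onto the Logger class so every logger gains .trace().
    logging.Logger.trace = trace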
@@ -0,0 +1,313 @@
+"""
+Health check manager with TTL caching and K8s response helpers.
+
+Consolidates health check storage, caching, and Kubernetes endpoint response
+generation into a single module.
+"""
+
+import logging
+import time
+from collections.abc import Awaitable, Callable
+from datetime import UTC, datetime
+from typing import Any
+
+from .support_types import HealthStatus, HealthStatusType
+
+logger = logging.getLogger(__name__)
+
+# =============================================================================
+# Health Result Storage (moved from DecoratorRegistry)
+# =============================================================================
+
+# Simple storage for the latest health check result dict
+# Format: {"status": "healthy/degraded/unhealthy", "agent": "...", ...}
+_health_check_result: dict | None = None
+
+
+def store_health_check_result(result: dict) -> None:
+    """Store health check result for K8s endpoints."""
+    global _health_check_result
+    _health_check_result = result
+    logger.debug(f"Stored health check result: {result.get('status', 'unknown')}")
+
+
+def get_health_check_result() -> dict | None:
+    """Get stored health check result."""
+    return _health_check_result
+
+
+def clear_health_check_result() -> None:
+    """Clear stored health check result."""
+    global _health_check_result
+    _health_check_result = None
+    logger.debug("Cleared health check result")
+
+
+# =============================================================================
+# TTL-Based Health Cache
+# =============================================================================
+
+# Global cache for HealthStatus objects with per-key TTL
+# Format: {"health:agent_id": (HealthStatus, expiry_timestamp)}
+_health_cache: dict[str, tuple[HealthStatus, float]] = {}
+_max_cache_size = 100
+
+
+async def get_health_status_with_cache(
+    agent_id: str,
+    health_check_fn: Callable[[], Awaitable[Any]] | None,
+    agent_config: dict[str, Any],
+    startup_context: dict[str, Any],
+    ttl: int = 15,
+) -> HealthStatus:
+    """
+    Get health status with TTL caching.
+
+    User health check can return:
+    - bool: True = HEALTHY, False = UNHEALTHY
+    - dict: {"status": "healthy/degraded/unhealthy", "checks": {...}, "errors": [...]}
+    - HealthStatus: Full object
+
+    Args:
+        agent_id: Unique identifier for the agent
+        health_check_fn: Optional async function for health check
+        agent_config: Agent configuration dict
+        startup_context: Full startup context with capabilities
+        ttl: Cache TTL in seconds (default: 15)
+
+    Returns:
+        HealthStatus from cache or fresh check
+    """
+    cache_key = f"health:{agent_id}"
+    current_time = time.time()
+
+    # Check cache
+    if cache_key in _health_cache:
+        cached_status, expiry_time = _health_cache[cache_key]
+        if current_time < expiry_time:
+            logger.debug(f"Health check cache HIT for agent '{agent_id}'")
+            return cached_status
+        else:
+            logger.debug(f"Health check cache EXPIRED for agent '{agent_id}'")
+            del _health_cache[cache_key]
+
+    logger.debug(f"Health check cache MISS for agent '{agent_id}'")
+
+    # Execute health check
+    health_status = await _execute_health_check(
+        agent_id, health_check_fn, agent_config, startup_context
+    )
+
+    # Store in cache
+    expiry_time = current_time + ttl
+    _health_cache[cache_key] = (health_status, expiry_time)
+    logger.debug(f"Cached health status for '{agent_id}' with TTL={ttl}s")
+
+    # Enforce max cache size
+    if len(_health_cache) > _max_cache_size:
+        oldest_key = min(_health_cache.keys(), key=lambda k: _health_cache[k][1])
+        del _health_cache[oldest_key]
+        logger.debug("Evicted oldest cache entry to maintain max size")
+
+    return health_status
+
+
+async def _execute_health_check(
+    agent_id: str,
+    health_check_fn: Callable[[], Awaitable[Any]] | None,
+    agent_config: dict[str, Any],
+    startup_context: dict[str, Any],
+) -> HealthStatus:
+    """Execute health check function and build HealthStatus."""
+    capabilities = _get_capabilities(startup_context, agent_config)
+
+    if health_check_fn:
+        try:
+            logger.debug(f"Executing health check for agent '{agent_id}'")
+            user_result = await health_check_fn()
+            status_type, checks, errors = _parse_health_result(user_result)
+
+            logger.info(f"Health check for '{agent_id}': {status_type.value}")
+
+        except Exception as e:
+            logger.warning(f"Health check failed for agent '{agent_id}': {e}")
+            status_type = HealthStatusType.DEGRADED
+            checks = {"health_check_execution": False}
+            errors = [f"Health check failed: {str(e)}"]
+    else:
+        # No health check provided - default to HEALTHY
+        logger.debug(f"No health check for '{agent_id}', using default HEALTHY")
+        status_type = HealthStatusType.HEALTHY
+        checks = {}
+        errors = []
+
+    return HealthStatus(
+        agent_name=agent_id,
+        status=status_type,
+        capabilities=capabilities,
+        checks=checks,
+        errors=errors,
+        timestamp=datetime.now(UTC),
+        version=agent_config.get("version", "1.0.0"),
+        metadata=agent_config,
+        uptime_seconds=0,
+    )
+
+
+def _get_capabilities(
+    startup_context: dict[str, Any],
+    agent_config: dict[str, Any],
+) -> list[str]:
+    """Get capabilities from context with fallbacks."""
+    capabilities = startup_context.get("capabilities", [])
+    if not capabilities:
+        capabilities = agent_config.get("capabilities", [])
+    if not capabilities:
+        capabilities = ["default"]
+    return capabilities
+
+
+def _parse_health_result(
+    user_result: Any,
+) -> tuple[HealthStatusType, dict, list]:
+    """Parse user health check result into status, checks, errors."""
+    if isinstance(user_result, bool):
+        status_type = (
+            HealthStatusType.HEALTHY if user_result else HealthStatusType.UNHEALTHY
+        )
+        checks = {"health_check": user_result}
+        errors = [] if user_result else ["Health check returned False"]
+
+    elif isinstance(user_result, dict):
+        status_str = user_result.get("status", "healthy").lower()
+        status_map = {
+            "healthy": HealthStatusType.HEALTHY,
+            "degraded": HealthStatusType.DEGRADED,
+            "unhealthy": HealthStatusType.UNHEALTHY,
+        }
+        status_type = status_map.get(status_str, HealthStatusType.UNKNOWN)
+        checks = user_result.get("checks", {})
+        errors = user_result.get("errors", [])
+
+    elif isinstance(user_result, HealthStatus):
+        status_type = user_result.status
+        checks = user_result.checks
+        errors = user_result.errors
+
+    else:
+        logger.warning(f"Unexpected health check result type: {type(user_result)}")
+        status_type = HealthStatusType.UNHEALTHY
+        checks = {"health_check_return_type": False}
+        errors = [f"Invalid return type: {type(user_result)}"]
+
+    return status_type, checks, errors
+
+
+def clear_health_cache(agent_id: str | None = None) -> None:
+    """Clear health cache for a specific agent or all agents."""
+    if agent_id:
+        cache_key = f"health:{agent_id}"
+        if cache_key in _health_cache:
+            del _health_cache[cache_key]
+        logger.debug(f"Cleared health cache for agent '{agent_id}'")
+    else:
+        _health_cache.clear()
+        logger.debug("Cleared entire health cache")
+
+
+def get_cache_stats() -> dict[str, Any]:
+    """Get cache statistics for monitoring."""
+    return {
+        "size": len(_health_cache),
+        "maxsize": _max_cache_size,
+        "ttl": 15,
+        "cached_agents": [key.replace("health:", "") for key in _health_cache.keys()],
+    }
+
+
+# =============================================================================
+# K8s Response Helpers
+# =============================================================================
+
+
+def build_health_response(
+    agent_name: str,
+    health_status: HealthStatus | None = None,
+) -> tuple[dict, int]:
+    """
+    Build /health endpoint response with appropriate HTTP status code.
+
+    Returns:
+        Tuple of (response_dict, http_status_code)
+    """
+    if health_status:
+        status = health_status.status.value
+        response = {
+            "status": status,
+            "agent": agent_name,
+            "checks": health_status.checks,
+            "errors": health_status.errors,
+            "timestamp": health_status.timestamp.isoformat(),
+        }
+    else:
+        # Use stored result if available
+        stored = get_health_check_result()
+        if stored:
+            status = stored.get("status", "starting")
+            response = stored
+        else:
+            status = "starting"
+            response = {"status": "starting", "message": "Agent is starting"}
+
+    # K8s expects 200 for healthy, 503 for everything else
+    http_status = 200 if status == "healthy" else 503
+    return response, http_status
+
+
+def build_ready_response(
+    agent_name: str,
+    mcp_wrappers_count: int = 0,
+) -> tuple[dict, int]:
+    """
+    Build /ready endpoint response with appropriate HTTP status code.
+
+    Returns:
+        Tuple of (response_dict, http_status_code)
+    """
+    stored = get_health_check_result()
+
+    if stored:
+        status = stored.get("status", "starting")
+        if status == "healthy":
+            return {
+                "ready": True,
+                "agent": agent_name,
+                "status": status,
+                "mcp_wrappers": mcp_wrappers_count,
+                "timestamp": datetime.now(UTC).isoformat(),
+            }, 200
+        else:
+            return {
+                "ready": False,
+                "agent": agent_name,
+                "status": status,
+                "reason": f"Service is {status}",
+                "errors": stored.get("errors", []),
+            }, 503
+    else:
+        # No health check configured - assume ready
+        return {
+            "ready": True,
+            "agent": agent_name,
+            "mcp_wrappers": mcp_wrappers_count,
+            "timestamp": datetime.now(UTC).isoformat(),
+        }, 200
+
+
+def build_livez_response(agent_name: str) -> dict:
+    """Build /livez endpoint response (always returns 200)."""
+    return {
+        "alive": True,
+        "agent": agent_name,
+        "timestamp": datetime.now(UTC).isoformat(),
+    }
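The response builders pair each JSON body with the status code Kubernetes probes expect: 200 only when the status is "healthy", 503 otherwise, and liveness always 200. A hypothetical sketch of wiring these helpers into probe routes; the FastAPI app, AGENT_ID, and empty config dicts are illustrative, since mcp-mesh registers its endpoints internally:

from fastapi import FastAPI
from fastapi.responses import JSONResponse

from _mcp_mesh.shared.health_check_manager import (
    build_health_response,
    build_livez_response,
    build_ready_response,
    get_health_status_with_cache,
)

app = FastAPI()
AGENT_ID = "my-agent"  # placeholder


@app.get("/health")
async def health() -> JSONResponse:
    # The TTL cache (15s default) keeps frequent kubelet probes from
    # re-running a potentially expensive user health check.
    status = await get_health_status_with_cache(
        agent_id=AGENT_ID,
        health_check_fn=None,  # or an async def returning bool/dict/HealthStatus
        agent_config={},
        startup_context={},
    )
    body, code = build_health_response(AGENT_ID, status)
    return JSONResponse(content=body, status_code=code)


@app.get("/ready")
async def ready() -> JSONResponse:
    body, code = build_ready_response(AGENT_ID)
    return JSONResponse(content=body, status_code=code)


@app.get("/livez")
async def livez() -> dict:
    return build_livez_response(AGENT_ID)

Note that build_ready_response reports ready when no health result has been stored yet, which keeps agents without a configured health check schedulable.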