PyPI - kubectl-mcp-server - Versions diffs - 1.16.0__py3-none-any.whl → 1.17.0__py3-none-any.whl - Mend

kubectl-mcp-server 1.16.0__py3-none-any.whl → 1.17.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/METADATA +1 -1
{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/RECORD +28 -14
kubectl_mcp_tool/__init__.py +1 -1
kubectl_mcp_tool/cli/cli.py +83 -9
kubectl_mcp_tool/cli/output.py +14 -0
kubectl_mcp_tool/config/__init__.py +46 -0
kubectl_mcp_tool/config/loader.py +386 -0
kubectl_mcp_tool/config/schema.py +184 -0
kubectl_mcp_tool/mcp_server.py +219 -8
kubectl_mcp_tool/observability/__init__.py +59 -0
kubectl_mcp_tool/observability/metrics.py +223 -0
kubectl_mcp_tool/observability/stats.py +255 -0
kubectl_mcp_tool/observability/tracing.py +335 -0
kubectl_mcp_tool/prompts/__init__.py +43 -0
kubectl_mcp_tool/prompts/builtin.py +695 -0
kubectl_mcp_tool/prompts/custom.py +298 -0
kubectl_mcp_tool/prompts/prompts.py +180 -4
kubectl_mcp_tool/safety.py +155 -0
kubectl_mcp_tool/tools/cluster.py +384 -0
tests/test_config.py +386 -0
tests/test_mcp_integration.py +251 -0
tests/test_observability.py +521 -0
tests/test_prompts.py +716 -0
tests/test_safety.py +218 -0
{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/WHEEL +0 -0
{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/entry_points.txt +0 -0
{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/licenses/LICENSE +0 -0
{kubectl_mcp_server-1.16.0.dist-info → kubectl_mcp_server-1.17.0.dist-info}/top_level.txt +0 -0

kubectl_mcp_tool/mcp_server.py CHANGED Viewed

@@ -23,12 +23,49 @@ import logging
 import asyncio
 import os
 import platform
-from typing import List, Optional, Any
+import signal
+from pathlib import Path
+from typing import List, Optional, Any, Dict
 # Import k8s_config early to patch kubernetes config for in-cluster support
 # This must be done before any tools are imported
 import kubectl_mcp_tool.k8s_config  # noqa: F401
+# Import safety mode for operation control
+from kubectl_mcp_tool.safety import (
+    SafetyMode,
+    set_safety_mode,
+    get_safety_mode,
+    get_mode_info,
+)
+# Import observability for metrics and tracing
+from kubectl_mcp_tool.observability import (
+    get_stats_collector,
+    get_metrics,
+    init_tracing,
+    shutdown_tracing,
+    is_prometheus_available,
+    is_tracing_available,
+    record_tool_call_metric,
+    record_tool_duration_metric,
+    record_tool_error_metric,
+)
+# Import config loader
+from kubectl_mcp_tool.config import (
+    load_config,
+    get_config,
+    register_reload_callback,
+    setup_sighup_handler,
+)
+# Import custom prompts
+from kubectl_mcp_tool.prompts import (
+    load_prompts_from_config,
+    get_builtin_prompts,
+)
 from kubectl_mcp_tool.tools import (
     register_helm_tools,
     register_pod_tools,
@@ -116,12 +153,20 @@ except ImportError:
 class MCPServer:
     """MCP server implementation."""
-    def __init__(self, name: str, non_destructive: bool = False):
+    def __init__(
+        self,
+        name: str,
+        read_only: bool = False,
+        disable_destructive: bool = False,
+        config_file: Optional[str] = None,
+    ):
         """Initialize the MCP server.
         Args:
             name: Server name for identification
-            non_destructive: If True, block destructive operations
+            read_only: If True, block all write operations (read-only mode)
+            disable_destructive: If True, block only destructive operations
+            config_file: Optional path to TOML config file
         Environment Variables:
             MCP_AUTH_ENABLED: Enable OAuth 2.1 authentication (default: false)
@@ -131,9 +176,29 @@ class MCPServer:
             MCP_AUTH_REQUIRED_SCOPES: Required scopes (default: mcp:tools)
         """
         self.name = name
-        self.non_destructive = non_destructive
         self._dependencies_checked = False
         self._dependencies_available = None
+        self._stats = get_stats_collector()
+        # Persist CLI safety overrides for reloads
+        self._cli_read_only = read_only
+        self._cli_disable_destructive = disable_destructive
+        # Load configuration from file and environment
+        self.config = self._load_configuration(config_file)
+        # Apply safety mode from config or parameters
+        self._apply_safety_mode(self._cli_read_only, self._cli_disable_destructive)
+        # For backward compatibility, expose non_destructive
+        self.non_destructive = get_safety_mode() != SafetyMode.NORMAL
+        # Initialize observability (tracing, metrics)
+        self._init_observability()
+        # Register config reload callback and set up SIGHUP handler
+        register_reload_callback(self._on_config_reload)
+        setup_sighup_handler()
         # Load authentication configuration
         self.auth_config = get_auth_config()
@@ -150,6 +215,71 @@ class MCPServer:
         self.setup_resources()
         self.setup_prompts()
+        # Log startup info
+        mode_info = get_mode_info()
+        logger.info(f"MCP Server initialized: {name}")
+        logger.info(f"Safety mode: {mode_info['mode']} - {mode_info['description']}")
+    def _load_configuration(self, config_file: Optional[str]) -> Any:
+        """Load configuration from TOML file and environment."""
+        try:
+            config = load_config(config_file=config_file if config_file else None)
+            logger.debug(f"Configuration loaded successfully")
+            return config
+        except Exception as e:
+            logger.warning(f"Failed to load config file: {e}. Using defaults.")
+            return load_config(skip_env=False)
+    def _apply_safety_mode(self, read_only: bool, disable_destructive: bool) -> None:
+        """Apply safety mode from config or CLI parameters.
+        CLI parameters take precedence over config file settings.
+        """
+        # Check config first
+        config_mode = getattr(self.config.safety, 'mode', 'normal') if hasattr(self.config, 'safety') else 'normal'
+        # CLI parameters override config
+        if read_only:
+            set_safety_mode(SafetyMode.READ_ONLY)
+        elif disable_destructive:
+            set_safety_mode(SafetyMode.DISABLE_DESTRUCTIVE)
+        elif config_mode == 'read-only' or config_mode == 'read_only':
+            set_safety_mode(SafetyMode.READ_ONLY)
+        elif config_mode == 'disable-destructive' or config_mode == 'disable_destructive':
+            set_safety_mode(SafetyMode.DISABLE_DESTRUCTIVE)
+        else:
+            set_safety_mode(SafetyMode.NORMAL)
+    def _init_observability(self) -> None:
+        """Initialize observability components (tracing, metrics)."""
+        # Check if tracing is enabled in config
+        tracing_enabled = getattr(self.config.metrics, 'tracing_enabled', False) if hasattr(self.config, 'metrics') else False
+        otlp_endpoint = getattr(self.config.metrics, 'otlp_endpoint', None) if hasattr(self.config, 'metrics') else None
+        if tracing_enabled or otlp_endpoint or os.environ.get('OTEL_EXPORTER_OTLP_ENDPOINT'):
+            try:
+                init_tracing()
+                logger.info("OpenTelemetry tracing initialized")
+            except Exception as e:
+                logger.warning(f"Failed to initialize tracing: {e}")
+        if is_prometheus_available():
+            logger.debug("Prometheus metrics available")
+    def _on_config_reload(self, new_config: Any) -> None:
+        """Handle configuration reload (called on SIGHUP)."""
+        logger.info("Configuration reloaded")
+        self.config = new_config
+        # Re-apply safety mode from new config, honoring CLI precedence
+        self._apply_safety_mode(self._cli_read_only, self._cli_disable_destructive)
+        # Refresh non_destructive flag
+        self.non_destructive = get_safety_mode() != SafetyMode.NORMAL
+        mode_info = get_mode_info()
+        logger.info(f"Safety mode after reload: {mode_info['mode']}")
     def _setup_auth(self) -> Optional[Any]:
         """Set up authentication if enabled."""
         if not self.auth_config.enabled:
@@ -228,8 +358,12 @@ class MCPServer:
         register_resources(self.server)
     def setup_prompts(self):
-        """Set up MCP prompts."""
-        register_prompts(self.server)
+        """Set up MCP prompts from built-in and custom config."""
+        # Get custom prompts path from config if specified
+        prompts_config_path = None
+        if hasattr(self.config, 'prompts') and hasattr(self.config.prompts, 'file'):
+            prompts_config_path = self.config.prompts.file
+        register_prompts(self.server, config_path=prompts_config_path)
     def _check_dependencies(self) -> bool:
         """Check if required dependencies are available."""
@@ -358,17 +492,51 @@ class MCPServer:
         try:
             # FastMCP 3 uses create_sse_app() to create a Starlette ASGI app
             from fastmcp.server.http import create_sse_app
+            from starlette.applications import Starlette
+            from starlette.responses import JSONResponse, PlainTextResponse
+            from starlette.routing import Route, Mount
+            # Create observability endpoints
+            async def health_check(request):
+                return JSONResponse({"status": "healthy", "server": self.name})
+            async def stats_endpoint(request):
+                stats = self._stats.get_stats()
+                return JSONResponse(stats)
+            async def metrics_endpoint(request):
+                if is_prometheus_available():
+                    metrics_text = get_metrics()
+                    return PlainTextResponse(metrics_text, media_type="text/plain; version=0.0.4; charset=utf-8")
+                else:
+                    return PlainTextResponse("# Prometheus metrics not available\n", media_type="text/plain")
+            async def safety_mode_endpoint(request):
+                mode_info = get_mode_info()
+                return JSONResponse(mode_info)
             # Create the SSE Starlette application
             # message_path: POST endpoint for client messages
             # sse_path: GET endpoint for SSE event stream
-            app = create_sse_app(
+            sse_app = create_sse_app(
                 self.server,
                 message_path="/messages/",
                 sse_path="/sse"
             )
+            # Create combined app with SSE and observability endpoints
+            app = Starlette(
+                routes=[
+                    Route("/health", health_check, methods=["GET"]),
+                    Route("/stats", stats_endpoint, methods=["GET"]),
+                    Route("/metrics", metrics_endpoint, methods=["GET"]),
+                    Route("/safety", safety_mode_endpoint, methods=["GET"]),
+                    Mount("/", app=sse_app),  # Mount SSE app at root
+                ]
+            )
             logger.info(f"SSE endpoints: GET /sse (events), POST /messages/ (messages)")
+            logger.info(f"Observability endpoints: GET /health, /stats, /metrics, /safety")
             # Run with uvicorn
             config = uvicorn.Config(app, host=host, port=port, log_level="info")
@@ -498,11 +666,33 @@ class MCPServer:
             """Health check endpoint."""
             return JSONResponse({"status": "healthy", "server": self.name})
+        async def stats_endpoint(request):
+            """Return runtime statistics."""
+            stats = self._stats.get_stats()
+            return JSONResponse(stats)
+        async def metrics_endpoint(request):
+            """Return Prometheus-format metrics."""
+            from starlette.responses import PlainTextResponse
+            if is_prometheus_available():
+                metrics_text = get_metrics()
+                return PlainTextResponse(metrics_text, media_type="text/plain; version=0.0.4; charset=utf-8")
+            else:
+                return PlainTextResponse("# Prometheus metrics not available\n", media_type="text/plain")
+        async def safety_mode_endpoint(request):
+            """Return current safety mode information."""
+            mode_info = get_mode_info()
+            return JSONResponse(mode_info)
         app = Starlette(
             routes=[
                 Route("/", handle_mcp_request, methods=["POST"]),
                 Route("/mcp", handle_mcp_request, methods=["POST"]),
                 Route("/health", health_check, methods=["GET"]),
+                Route("/stats", stats_endpoint, methods=["GET"]),
+                Route("/metrics", metrics_endpoint, methods=["GET"]),
+                Route("/safety", safety_mode_endpoint, methods=["GET"]),
             ]
         )
@@ -535,10 +725,31 @@ if __name__ == "__main__":
         default="0.0.0.0",
         help="Host to bind to for SSE/HTTP transport. Default: 0.0.0.0.",
     )
+    parser.add_argument(
+        "--config",
+        type=str,
+        default=None,
+        help="Path to TOML configuration file.",
+    )
+    parser.add_argument(
+        "--read-only",
+        action="store_true",
+        help="Enable read-only mode (block all write operations).",
+    )
+    parser.add_argument(
+        "--disable-destructive",
+        action="store_true",
+        help="Disable destructive operations (allow create/update, block delete).",
+    )
     args = parser.parse_args()
     server_name = "kubectl_mcp_server"
-    mcp_server = MCPServer(name=server_name)
+    mcp_server = MCPServer(
+        name=server_name,
+        read_only=args.read_only,
+        disable_destructive=args.disable_destructive,
+        config_file=args.config,
+    )
     # Handle signals gracefully with immediate exit
     def signal_handler(sig, frame):

kubectl_mcp_tool/observability/__init__.py ADDED Viewed

@@ -0,0 +1,59 @@
+"""
+Observability module for kubectl-mcp-server.
+Provides:
+- StatsCollector: Runtime statistics and metrics collection
+- Prometheus metrics: Standard Prometheus format metrics
+- OpenTelemetry tracing: Distributed tracing with OTLP export
+Usage:
+    # Stats collection
+    from kubectl_mcp_tool.observability import get_stats_collector
+    stats = get_stats_collector()
+    stats.record_tool_call("get_pods", success=True, duration=0.5)
+    # Prometheus metrics
+    from kubectl_mcp_tool.observability import get_metrics
+    metrics_text = get_metrics()
+    # Tracing
+    from kubectl_mcp_tool.observability import init_tracing, traced_tool_call
+    init_tracing()
+    with traced_tool_call("get_pods") as span:
+        # execute tool
+        pass
+"""
+from .stats import StatsCollector, get_stats_collector
+from .metrics import (
+    get_metrics,
+    record_tool_call_metric,
+    record_tool_error_metric,
+    record_tool_duration_metric,
+    is_prometheus_available,
+)
+from .tracing import (
+    init_tracing,
+    traced_tool_call,
+    get_tracer,
+    is_tracing_available,
+    shutdown_tracing,
+)
+__all__ = [
+    # Stats
+    "StatsCollector",
+    "get_stats_collector",
+    # Metrics
+    "get_metrics",
+    "record_tool_call_metric",
+    "record_tool_error_metric",
+    "record_tool_duration_metric",
+    "is_prometheus_available",
+    # Tracing
+    "init_tracing",
+    "traced_tool_call",
+    "get_tracer",
+    "is_tracing_available",
+    "shutdown_tracing",
+]

kubectl_mcp_tool/observability/metrics.py ADDED Viewed

@@ -0,0 +1,223 @@
+"""
+Prometheus metrics for kubectl-mcp-server.
+Provides standard Prometheus format metrics for production monitoring.
+Metrics exposed:
+- mcp_tool_calls_total: Counter of tool invocations (labels: tool_name, status)
+- mcp_tool_errors_total: Counter of tool errors (labels: tool_name, error_type)
+- mcp_tool_duration_seconds: Histogram of tool call durations (labels: tool_name)
+- mcp_http_requests_total: Counter of HTTP requests (labels: endpoint, method, status)
+- mcp_server_info: Gauge with server metadata
+Requires: prometheus-client>=0.19.0 (optional dependency)
+"""
+import logging
+from typing import Optional
+logger = logging.getLogger(__name__)
+# Check if prometheus_client is available
+_prometheus_available = False
+_REGISTRY = None
+_tool_calls_counter = None
+_tool_errors_counter = None
+_tool_duration_histogram = None
+_http_requests_counter = None
+_server_info_gauge = None
+try:
+    from prometheus_client import (
+        Counter,
+        Histogram,
+        Gauge,
+        CollectorRegistry,
+        generate_latest,
+        CONTENT_TYPE_LATEST,
+    )
+    _prometheus_available = True
+    # Create a custom registry to avoid conflicts
+    _REGISTRY = CollectorRegistry()
+    # Tool call counter
+    _tool_calls_counter = Counter(
+        "mcp_tool_calls_total",
+        "Total number of MCP tool calls",
+        ["tool_name", "status"],
+        registry=_REGISTRY,
+    )
+    # Tool error counter
+    _tool_errors_counter = Counter(
+        "mcp_tool_errors_total",
+        "Total number of MCP tool errors",
+        ["tool_name", "error_type"],
+        registry=_REGISTRY,
+    )
+    # Tool duration histogram
+    # Buckets optimized for typical k8s API call durations
+    _tool_duration_histogram = Histogram(
+        "mcp_tool_duration_seconds",
+        "Duration of MCP tool calls in seconds",
+        ["tool_name"],
+        buckets=(0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1.0, 2.5, 5.0, 10.0, 30.0),
+        registry=_REGISTRY,
+    )
+    # HTTP requests counter
+    _http_requests_counter = Counter(
+        "mcp_http_requests_total",
+        "Total number of HTTP requests",
+        ["endpoint", "method", "status"],
+        registry=_REGISTRY,
+    )
+    # Server info gauge (version, features)
+    _server_info_gauge = Gauge(
+        "mcp_server_info",
+        "MCP server information",
+        ["version", "transport"],
+        registry=_REGISTRY,
+    )
+    logger.debug("Prometheus metrics initialized successfully")
+except ImportError:
+    logger.debug(
+        "prometheus_client not installed. Prometheus metrics disabled. "
+        "Install with: pip install kubectl-mcp-server[observability]"
+    )
+def is_prometheus_available() -> bool:
+    """Check if Prometheus client is available."""
+    return _prometheus_available
+def record_tool_call_metric(
+    tool_name: str,
+    success: bool = True,
+    duration: float = 0.0
+) -> None:
+    """
+    Record a tool call in Prometheus metrics.
+    Args:
+        tool_name: Name of the tool called
+        success: Whether the call succeeded
+        duration: Call duration in seconds
+    """
+    if not _prometheus_available:
+        return
+    status = "success" if success else "error"
+    _tool_calls_counter.labels(tool_name=tool_name, status=status).inc()
+    if duration > 0:
+        _tool_duration_histogram.labels(tool_name=tool_name).observe(duration)
+def record_tool_error_metric(
+    tool_name: str,
+    error_type: str = "unknown"
+) -> None:
+    """
+    Record a tool error in Prometheus metrics.
+    Args:
+        tool_name: Name of the tool that errored
+        error_type: Type/category of error (e.g., "timeout", "validation", "k8s_api")
+    """
+    if not _prometheus_available:
+        return
+    _tool_errors_counter.labels(
+        tool_name=tool_name,
+        error_type=error_type
+    ).inc()
+def record_tool_duration_metric(tool_name: str, duration: float) -> None:
+    """
+    Record tool duration in Prometheus histogram.
+    Args:
+        tool_name: Name of the tool
+        duration: Duration in seconds
+    """
+    if not _prometheus_available:
+        return
+    _tool_duration_histogram.labels(tool_name=tool_name).observe(duration)
+def record_http_request_metric(
+    endpoint: str,
+    method: str,
+    status: int = 200
+) -> None:
+    """
+    Record an HTTP request in Prometheus metrics.
+    Args:
+        endpoint: Request endpoint path
+        method: HTTP method
+        status: HTTP status code
+    """
+    if not _prometheus_available:
+        return
+    _http_requests_counter.labels(
+        endpoint=endpoint,
+        method=method,
+        status=str(status)
+    ).inc()
+def set_server_info(version: str, transport: str) -> None:
+    """
+    Set server info in Prometheus gauge.
+    Args:
+        version: Server version
+        transport: Transport type (stdio, sse, http)
+    """
+    if not _prometheus_available:
+        return
+    _server_info_gauge.labels(version=version, transport=transport).set(1)
+def get_metrics() -> str:
+    """
+    Get metrics in Prometheus text format.
+    Returns:
+        Prometheus metrics as text, or error message if unavailable
+    """
+    if not _prometheus_available:
+        return (
+            "# Prometheus metrics not available.\n"
+            "# Install with: pip install kubectl-mcp-server[observability]\n"
+        )
+    try:
+        return generate_latest(_REGISTRY).decode("utf-8")
+    except Exception as e:
+        logger.error(f"Error generating Prometheus metrics: {e}")
+        return f"# Error generating metrics: {e}\n"
+def get_metrics_content_type() -> str:
+    """
+    Get the content type for Prometheus metrics.
+    Returns:
+        Prometheus content type string
+    """
+    if not _prometheus_available:
+        return "text/plain; charset=utf-8"
+    return CONTENT_TYPE_LATEST

kubectl-mcp-server 1.16.0__py3-none-any.whl → 1.17.0__py3-none-any.whl

kubectl-mcp-server 1.16.0__py3-none-any.whl → 1.17.0__py3-none-any.whl