mcp-code-indexer 1.9.1__py3-none-any.whl → 2.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mcp_code_indexer/database/connection_health.py +441 -0
- mcp_code_indexer/database/database.py +361 -26
- mcp_code_indexer/database/retry_handler.py +344 -0
- mcp_code_indexer/logging_config.py +29 -0
- mcp_code_indexer/middleware/error_middleware.py +41 -0
- mcp_code_indexer/server/mcp_server.py +56 -2
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/METADATA +68 -15
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/RECORD +12 -10
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/WHEEL +0 -0
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/entry_points.txt +0 -0
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/licenses/LICENSE +0 -0
- {mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/top_level.txt +0 -0
mcp_code_indexer/database/retry_handler.py
@@ -0,0 +1,344 @@
+"""
+Database retry handling for SQLite locking scenarios.
+
+This module provides specialized retry logic for database operations that may
+encounter locking issues in high-concurrency environments.
+"""
+
+import asyncio
+import logging
+import random
+import time
+from contextlib import asynccontextmanager
+from dataclasses import dataclass
+from typing import Any, AsyncIterator, Callable, Optional, Type, Union
+from datetime import datetime
+
+import aiosqlite
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass
+class RetryConfig:
+    """Configuration for database retry logic."""
+    max_attempts: int = 5
+    initial_delay: float = 0.1  # seconds
+    max_delay: float = 2.0  # seconds
+    backoff_multiplier: float = 2.0
+    jitter: bool = True
+    retry_on_error_types: tuple = (aiosqlite.OperationalError,)
+
+
+class DatabaseLockError(Exception):
+    """Exception for database locking issues."""
+
+    def __init__(self, message: str, retry_count: int = 0, last_attempt: Optional[datetime] = None):
+        self.message = message
+        self.retry_count = retry_count
+        self.last_attempt = last_attempt or datetime.utcnow()
+        super().__init__(message)
+
+
+class RetryHandler:
+    """Handles database operation retries with exponential backoff."""
+
+    def __init__(self, config: Optional[RetryConfig] = None):
+        """
+        Initialize retry handler.
+
+        Args:
+            config: Retry configuration, uses defaults if None
+        """
+        self.config = config or RetryConfig()
+        self._retry_stats = {
+            "total_attempts": 0,
+            "successful_retries": 0,
+            "failed_operations": 0,
+            "avg_retry_delay": 0.0
+        }
+
+    @asynccontextmanager
+    async def with_retry(self, operation_name: str = "database_operation") -> AsyncIterator[None]:
+        """
+        Context manager that provides retry logic for database operations.
+
+        Args:
+            operation_name: Name of the operation for logging
+
+        Usage:
+            async with retry_handler.with_retry("create_project"):
+                # Your database operation here
+                await db.execute(...)
+        """
+        last_error = None
+        total_delay = 0.0
+
+        for attempt in range(1, self.config.max_attempts + 1):
+            self._retry_stats["total_attempts"] += 1
+
+            try:
+                yield
+
+                # Success - log if this was a retry
+                if attempt > 1:
+                    self._retry_stats["successful_retries"] += 1
+                    logger.info(
+                        f"Database operation '{operation_name}' succeeded on attempt {attempt}",
+                        extra={
+                            "structured_data": {
+                                "retry_success": {
+                                    "operation": operation_name,
+                                    "attempt": attempt,
+                                    "total_delay": total_delay
+                                }
+                            }
+                        }
+                    )
+                return
+
+            except Exception as e:
+                last_error = e
+
+                # Check if this is a retryable error
+                if not self._is_retryable_error(e):
+                    logger.error(
+                        f"Non-retryable error in '{operation_name}': {e}",
+                        extra={
+                            "structured_data": {
+                                "non_retryable_error": {
+                                    "operation": operation_name,
+                                    "error_type": type(e).__name__,
+                                    "error_message": str(e)
+                                }
+                            }
+                        }
+                    )
+                    raise
+
+                # If this is the last attempt, give up
+                if attempt >= self.config.max_attempts:
+                    self._retry_stats["failed_operations"] += 1
+                    logger.error(
+                        f"Database operation '{operation_name}' failed after {attempt} attempts",
+                        extra={
+                            "structured_data": {
+                                "retry_exhausted": {
+                                    "operation": operation_name,
+                                    "max_attempts": self.config.max_attempts,
+                                    "total_delay": total_delay,
+                                    "final_error": str(e)
+                                }
+                            }
+                        }
+                    )
+                    raise DatabaseLockError(
+                        f"Database operation failed after {attempt} attempts: {e}",
+                        retry_count=attempt,
+                        last_attempt=datetime.utcnow()
+                    )
+
+                # Calculate delay for next attempt
+                delay = self._calculate_delay(attempt)
+                total_delay += delay
+
+                logger.warning(
+                    f"Database operation '{operation_name}' failed on attempt {attempt}, retrying in {delay:.2f}s",
+                    extra={
+                        "structured_data": {
+                            "retry_attempt": {
+                                "operation": operation_name,
+                                "attempt": attempt,
+                                "delay_seconds": delay,
+                                "error_type": type(e).__name__,
+                                "error_message": str(e)
+                            }
+                        }
+                    }
+                )
+
+                # Wait before retry
+                await asyncio.sleep(delay)
+
+    def _is_retryable_error(self, error: Exception) -> bool:
+        """
+        Determine if an error is retryable.
+
+        Args:
+            error: Exception to check
+
+        Returns:
+            True if the error should trigger a retry
+        """
+        # Check error type
+        if not isinstance(error, self.config.retry_on_error_types):
+            return False
+
+        # Check specific SQLite error messages
+        error_message = str(error).lower()
+        retryable_messages = [
+            "database is locked",
+            "database is busy",
+            "cannot start a transaction within a transaction",
+            "sqlite_busy",
+            "sqlite_locked"
+        ]
+
+        return any(msg in error_message for msg in retryable_messages)
+
+    def _calculate_delay(self, attempt: int) -> float:
+        """
+        Calculate delay for retry attempt with exponential backoff and jitter.
+
+        Args:
+            attempt: Current attempt number (1-based)
+
+        Returns:
+            Delay in seconds
+        """
+        # Exponential backoff: initial_delay * (multiplier ^ (attempt - 1))
+        delay = self.config.initial_delay * (self.config.backoff_multiplier ** (attempt - 1))
+
+        # Cap at max delay
+        delay = min(delay, self.config.max_delay)
+
+        # Add jitter to prevent thundering herd
+        if self.config.jitter:
+            jitter_range = delay * 0.1  # 10% jitter
+            delay += random.uniform(-jitter_range, jitter_range)
+
+        # Ensure delay is positive
+        return max(0.0, delay)
+
+    def get_retry_stats(self) -> dict:
+        """
+        Get retry statistics.
+
+        Returns:
+            Dictionary with retry statistics
+        """
+        if self._retry_stats["successful_retries"] > 0:
+            self._retry_stats["avg_retry_delay"] = (
+                self._retry_stats["total_attempts"] / self._retry_stats["successful_retries"]
+            )
+
+        return self._retry_stats.copy()
+
+    def reset_stats(self) -> None:
+        """Reset retry statistics."""
+        self._retry_stats = {
+            "total_attempts": 0,
+            "successful_retries": 0,
+            "failed_operations": 0,
+            "avg_retry_delay": 0.0
+        }
+
+
+class ConnectionRecoveryManager:
+    """Manages database connection recovery for persistent failures."""
+
+    def __init__(self, database_manager):
+        """
+        Initialize connection recovery manager.
+
+        Args:
+            database_manager: DatabaseManager instance to manage
+        """
+        self.database_manager = database_manager
+        self._recovery_stats = {
+            "pool_refreshes": 0,
+            "last_refresh": None,
+            "consecutive_failures": 0
+        }
+        self._failure_threshold = 3  # Refresh pool after 3 consecutive failures
+
+    async def handle_persistent_failure(self, operation_name: str, error: Exception) -> bool:
+        """
+        Handle persistent database failures by attempting pool refresh.
+
+        Args:
+            operation_name: Name of the failing operation
+            error: The persistent error
+
+        Returns:
+            True if pool refresh was attempted, False otherwise
+        """
+        self._recovery_stats["consecutive_failures"] += 1
+
+        # Only refresh if we've hit the threshold
+        if self._recovery_stats["consecutive_failures"] >= self._failure_threshold:
+            logger.warning(
+                f"Attempting connection pool refresh after {self._recovery_stats['consecutive_failures']} failures",
+                extra={
+                    "structured_data": {
+                        "pool_recovery": {
+                            "operation": operation_name,
+                            "consecutive_failures": self._recovery_stats["consecutive_failures"],
+                            "trigger_error": str(error)
+                        }
+                    }
+                }
+            )
+
+            await self._refresh_connection_pool()
+            return True
+
+        return False
+
+    def reset_failure_count(self) -> None:
+        """Reset consecutive failure count after successful operation."""
+        self._recovery_stats["consecutive_failures"] = 0
+
+    async def _refresh_connection_pool(self) -> None:
+        """
+        Refresh the database connection pool by closing all connections.
+
+        This forces creation of new connections on next access.
+        """
+        try:
+            # Close existing pool
+            await self.database_manager.close_pool()
+
+            # Update stats
+            self._recovery_stats["pool_refreshes"] += 1
+            self._recovery_stats["last_refresh"] = datetime.utcnow()
+            self._recovery_stats["consecutive_failures"] = 0
+
+            logger.info("Database connection pool refreshed successfully")
+
+        except Exception as e:
+            logger.error(f"Failed to refresh connection pool: {e}")
+            raise
+
+    def get_recovery_stats(self) -> dict:
+        """
+        Get connection recovery statistics.
+
+        Returns:
+            Dictionary with recovery statistics
+        """
+        return self._recovery_stats.copy()
+
+
+def create_retry_handler(
+    max_attempts: int = 5,
+    initial_delay: float = 0.1,
+    max_delay: float = 2.0
+) -> RetryHandler:
+    """
+    Create a configured retry handler for database operations.
+
+    Args:
+        max_attempts: Maximum retry attempts
+        initial_delay: Initial delay in seconds
+        max_delay: Maximum delay in seconds
+
+    Returns:
+        Configured RetryHandler instance
+    """
+    config = RetryConfig(
+        max_attempts=max_attempts,
+        initial_delay=initial_delay,
+        max_delay=max_delay
+    )
+    return RetryHandler(config)
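For orientation, the new module's `with_retry` docstring documents the intended call pattern; a minimal sketch of driving it against an aiosqlite connection (the database path and SQL here are illustrative placeholders, not taken from the package):

```python
import asyncio

import aiosqlite

from mcp_code_indexer.database.retry_handler import create_retry_handler


async def main() -> None:
    # Defaults from the diff: 5 attempts, 0.1s initial delay, 2.0s cap.
    handler = create_retry_handler(max_attempts=5, initial_delay=0.1, max_delay=2.0)

    # Placeholder path and SQL; any aiosqlite write would look the same.
    async with aiosqlite.connect("example.db") as db:
        async with handler.with_retry("create_notes_table"):
            await db.execute(
                "CREATE TABLE IF NOT EXISTS notes (id INTEGER PRIMARY KEY, body TEXT)"
            )
            await db.commit()

    print(handler.get_retry_stats())


asyncio.run(main())
```

With the defaults, the scheduled waits after failed attempts follow the exponential schedule 0.1 s, 0.2 s, 0.4 s, 0.8 s, each perturbed by ±10% jitter and capped at 2.0 s.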
mcp_code_indexer/logging_config.py
@@ -255,6 +255,35 @@ def log_performance_metrics(
     )
 
 
+def log_database_metrics(
+    logger: logging.Logger,
+    operation_name: str,
+    metrics: dict,
+    health_status: Optional[dict] = None
+) -> None:
+    """
+    Log database performance and health metrics.
+
+    Args:
+        logger: Logger instance
+        operation_name: Name of the database operation
+        metrics: Database performance metrics
+        health_status: Current health status (optional)
+    """
+    log_data = {
+        "operation": operation_name,
+        "metrics": metrics
+    }
+
+    if health_status:
+        log_data["health_status"] = health_status
+
+    logger.info(
+        f"Database metrics for {operation_name}",
+        extra={"structured_data": {"database_metrics": log_data}}
+    )
+
+
 def log_tool_usage(
     logger: logging.Logger,
     tool_name: str,
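The new helper simply wraps `logger.info` with a `structured_data` payload, so a call might look like this (the metric and health keys below are made-up examples; the function forwards whatever dicts it receives):

```python
import logging

from mcp_code_indexer.logging_config import log_database_metrics

logger = logging.getLogger("mcp_code_indexer")

# Example keys only; metrics and health_status pass through unchanged
# into extra["structured_data"]["database_metrics"].
log_database_metrics(
    logger,
    operation_name="update_file_description",
    metrics={"duration_ms": 12.5, "rows_affected": 1},
    health_status={"is_healthy": True, "consecutive_failures": 0},
)
```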
mcp_code_indexer/middleware/error_middleware.py
@@ -10,6 +10,7 @@ import functools
 import time
 from typing import Any, Callable, Dict, List
 
+import aiosqlite
 from mcp import types
 
 from mcp_code_indexer.error_handler import ErrorHandler, MCPError
@@ -77,6 +78,22 @@ class ToolMiddleware:
                except Exception as e:
                    duration = time.time() - start_time
 
+                   # Enhanced SQLite error handling
+                   if self._is_database_locking_error(e):
+                       logger.warning(
+                           f"Database locking error in tool {tool_name}: {e}",
+                           extra={
+                               "structured_data": {
+                                   "database_locking_error": {
+                                       "tool_name": tool_name,
+                                       "error_type": type(e).__name__,
+                                       "error_message": str(e),
+                                       "duration": duration
+                                   }
+                               }
+                           }
+                       )
+
                    # Log the error
                    self.error_handler.log_error(
                        e,
@@ -143,6 +160,30 @@ class ToolMiddleware:
 
                return wrapper
            return decorator
+
+    def _is_database_locking_error(self, error: Exception) -> bool:
+        """
+        Check if an error is related to database locking.
+
+        Args:
+            error: Exception to check
+
+        Returns:
+            True if this is a database locking error
+        """
+        # Check for SQLite locking errors
+        if isinstance(error, aiosqlite.OperationalError):
+            error_message = str(error).lower()
+            locking_keywords = [
+                "database is locked",
+                "database is busy",
+                "sqlite_busy",
+                "sqlite_locked",
+                "cannot start a transaction within a transaction"
+            ]
+            return any(keyword in error_message for keyword in locking_keywords)
+
+        return False
 
 
 class AsyncTaskManager:
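Since the middleware classifies errors purely by type and message text, the check can be exercised in isolation; a standalone sketch mirroring the same substring logic:

```python
import aiosqlite  # aiosqlite re-exports sqlite3's OperationalError


def looks_like_lock_error(error: Exception) -> bool:
    """Standalone mirror of ToolMiddleware._is_database_locking_error."""
    if not isinstance(error, aiosqlite.OperationalError):
        return False
    message = str(error).lower()
    keywords = (
        "database is locked",
        "database is busy",
        "sqlite_busy",
        "sqlite_locked",
        "cannot start a transaction within a transaction",
    )
    return any(keyword in message for keyword in keywords)


assert looks_like_lock_error(aiosqlite.OperationalError("database is locked"))
assert not looks_like_lock_error(aiosqlite.OperationalError("no such table: files"))
assert not looks_like_lock_error(ValueError("database is locked"))  # wrong type
```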
mcp_code_indexer/server/mcp_server.py
@@ -49,7 +49,12 @@ class MCPCodeIndexServer:
         self,
         token_limit: int = 32000,
         db_path: Optional[Path] = None,
-        cache_dir: Optional[Path] = None
+        cache_dir: Optional[Path] = None,
+        db_pool_size: int = 3,
+        db_retry_count: int = 5,
+        db_timeout: float = 10.0,
+        enable_wal_mode: bool = True,
+        health_check_interval: float = 30.0
     ):
         """
         Initialize the MCP Code Index Server.
@@ -58,13 +63,34 @@ class MCPCodeIndexServer:
             token_limit: Maximum tokens before recommending search over overview
             db_path: Path to SQLite database
             cache_dir: Directory for caching
+            db_pool_size: Database connection pool size
+            db_retry_count: Maximum database operation retry attempts
+            db_timeout: Database transaction timeout in seconds
+            enable_wal_mode: Enable WAL mode for better concurrent access
+            health_check_interval: Database health check interval in seconds
         """
         self.token_limit = token_limit
         self.db_path = db_path or Path.home() / ".mcp-code-index" / "tracker.db"
         self.cache_dir = cache_dir or Path.home() / ".mcp-code-index" / "cache"
 
+        # Store database configuration
+        self.db_config = {
+            "pool_size": db_pool_size,
+            "retry_count": db_retry_count,
+            "timeout": db_timeout,
+            "enable_wal_mode": enable_wal_mode,
+            "health_check_interval": health_check_interval
+        }
+
         # Initialize components
-        self.db_manager = DatabaseManager(
+        self.db_manager = DatabaseManager(
+            db_path=self.db_path,
+            pool_size=db_pool_size,
+            retry_count=db_retry_count,
+            timeout=db_timeout,
+            enable_wal_mode=enable_wal_mode,
+            health_check_interval=health_check_interval
+        )
         self.token_counter = TokenCounter(token_limit)
         self.merge_handler = MergeHandler(self.db_manager)
 
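The new constructor parameters thread straight through to `DatabaseManager`; a sketch of constructing the server with explicit values (the values shown are the documented defaults, and the paths are placeholders):

```python
from pathlib import Path

from mcp_code_indexer.server.mcp_server import MCPCodeIndexServer

# Placeholder paths; omitting them falls back to ~/.mcp-code-index/.
server = MCPCodeIndexServer(
    token_limit=32000,
    db_path=Path("/tmp/mcp-index/tracker.db"),
    cache_dir=Path("/tmp/mcp-index/cache"),
    db_pool_size=3,              # connections kept in the pool
    db_retry_count=5,            # max attempts per failed operation
    db_timeout=10.0,             # transaction timeout, seconds
    enable_wal_mode=True,        # WAL: concurrent readers, single writer
    health_check_interval=30.0,  # seconds between health probes
)
```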
@@ -431,6 +457,15 @@ src/
                     "required": ["projectName", "folderPath", "branch"],
                     "additionalProperties": False
                 }
+            ),
+            types.Tool(
+                name="check_database_health",
+                description="Perform health diagnostics for the MCP Code Indexer's SQLite database and connection pool. Returns database resilience metrics, connection pool status, WAL mode performance, and file description storage statistics for monitoring the code indexer's database locking improvements.",
+                inputSchema={
+                    "type": "object",
+                    "properties": {},
+                    "additionalProperties": False
+                }
             )
         ]
 
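From a client's perspective, the new tool takes an empty arguments object; a minimal sketch using the `mcp` Python SDK (the initialized `session` and its transport setup are assumed, not shown in the diff):

```python
# Assumes an initialized mcp.ClientSession named `session`
# connected to the server over stdio.
result = await session.call_tool("check_database_health", arguments={})
print(result.content)  # the health report returned by the server
```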
@@ -455,6 +490,7 @@ src/
             "update_codebase_overview": self._handle_update_codebase_overview,
             "get_word_frequency": self._handle_get_word_frequency,
             "merge_branch_descriptions": self._handle_merge_branch_descriptions,
+            "check_database_health": self._handle_check_database_health,
         }
 
         if name not in tool_handlers:
@@ -1157,6 +1193,24 @@ src/
             "totalUniqueTerms": result.total_unique_terms
         }
 
+    async def _handle_check_database_health(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
+        """Handle check_database_health tool calls."""
+        # Get comprehensive database health and statistics
+        health_check = await self.db_manager.check_health()
+        database_stats = self.db_manager.get_database_stats()
+
+        return {
+            "health_check": health_check,
+            "database_stats": database_stats,
+            "configuration": self.db_config,
+            "server_info": {
+                "token_limit": self.token_limit,
+                "db_path": str(self.db_path),
+                "cache_dir": str(self.cache_dir)
+            },
+            "timestamp": datetime.utcnow().isoformat()
+        }
+
     async def _run_session_with_retry(self, read_stream, write_stream, initialization_options) -> None:
         """Run a single MCP session with error handling and retry logic."""
         max_retries = 3
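The handler aggregates four sources into one payload; a plausible, abridged response shape based on the code above (the `health_check` and `database_stats` contents come from `DatabaseManager` and will vary by deployment):

```python
# Illustrative shape only; values shown are the documented defaults
# and placeholder paths, not real output.
example_response = {
    "health_check": {},        # from db_manager.check_health()
    "database_stats": {},      # from db_manager.get_database_stats()
    "configuration": {
        "pool_size": 3,
        "retry_count": 5,
        "timeout": 10.0,
        "enable_wal_mode": True,
        "health_check_interval": 30.0,
    },
    "server_info": {
        "token_limit": 32000,
        "db_path": "/home/user/.mcp-code-index/tracker.db",
        "cache_dir": "/home/user/.mcp-code-index/cache",
    },
    "timestamp": "2025-06-01T12:00:00",  # datetime.utcnow().isoformat()
}
```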
{mcp_code_indexer-1.9.1.dist-info → mcp_code_indexer-2.0.1.dist-info}/METADATA
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mcp-code-indexer
-Version: 1.9.1
+Version: 2.0.1
 Summary: MCP server that tracks file descriptions across codebases, enabling AI agents to efficiently navigate and understand code through searchable summaries and token-aware overviews.
 Author: MCP Code Indexer Contributors
 Maintainer: MCP Code Indexer Contributors
@@ -59,11 +59,11 @@ Dynamic: requires-python
 
 # MCP Code Indexer 🚀
 
-[](https://badge.fury.io/py/mcp-code-indexer)
+[](https://pypi.org/project/mcp-code-indexer/)
 [](https://opensource.org/licenses/MIT)
 
-A production-ready **Model Context Protocol (MCP) server** that revolutionizes how AI agents navigate and understand codebases.
+A production-ready **Model Context Protocol (MCP) server** that revolutionizes how AI agents navigate and understand codebases. Built for high-concurrency environments with advanced database resilience, the server provides instant access to intelligent descriptions, semantic search, and context-aware recommendations while maintaining 800+ writes/sec throughput.
 
 ## 🎯 What It Does
 
@@ -227,7 +227,7 @@ mypy src/
 
 ## 🛠️ MCP Tools Available
 
-The server provides **11 powerful MCP tools** for intelligent codebase management. Whether you're an AI agent or human developer, these tools make navigating code effortless.
+The server provides **12 powerful MCP tools** for intelligent codebase management. Whether you're an AI agent or human developer, these tools make navigating code effortless.
 
 ### 🎯 For Everyone: Start Here
 - **`check_codebase_size`** - Get instant recommendations for how to navigate your codebase
@@ -246,6 +246,9 @@ The server provides **11 powerful MCP tools** for intelligent codebase managemen
 - **`merge_branch_descriptions`** - Two-phase merge with conflict resolution
 - **`update_codebase_overview`** - Create comprehensive codebase documentation
 
+### 🏥 For System Monitoring: Health & Performance
+- **`check_database_health`** - Real-time database health monitoring and diagnostics
+
 💡 **Pro Tip**: Always start with `check_codebase_size` to get personalized recommendations for navigating your specific codebase.
 
 ## 🔗 Git Hook Integration
@@ -272,24 +275,29 @@ See the **[Git Hook Setup Guide](docs/git-hook-setup.md)** for complete installa
 
 ## 🏗️ Architecture Highlights
 
-### Performance Optimized
-- **SQLite with WAL mode** for high-concurrency access
-- **
-- **FTS5 full-text search** with prefix indexing
+### 🚀 Performance Optimized
+- **SQLite with WAL mode** for high-concurrency access (800+ writes/sec)
+- **Smart connection pooling** with optimized pool size (3 connections default)
+- **FTS5 full-text search** with prefix indexing for sub-100ms queries
 - **Token-aware caching** to minimize expensive operations
+- **Write operation serialization** to eliminate database lock conflicts
 
-### Production Ready
-- **
+### 🛡️ Production Ready
+- **Database resilience features** with <2% error rate under high load
+- **Exponential backoff retry logic** with intelligent failure recovery
+- **Comprehensive health monitoring** with automatic pool refresh
+- **Structured JSON logging** with performance metrics tracking
 - **Async-first design** with proper resource cleanup
 - **MCP protocol compliant** with clean stdio streams
 - **Upstream inheritance** for fork workflows
 - **Git integration** with .gitignore support
 
-### Developer Friendly
-- **95%+ test coverage** with async support
-- **Integration tests** for complete workflows
-- **Performance benchmarks** for large codebases
+### 👨‍💻 Developer Friendly
+- **95%+ test coverage** with async support and concurrent access tests
+- **Integration tests** for complete workflows including database stress testing
+- **Performance benchmarks** for large codebases with resilience validation
 - **Clear error messages** with MCP protocol compliance
+- **Comprehensive configuration options** for production tuning
 
 ## 📖 Documentation
 
@@ -300,6 +308,11 @@ See the **[Git Hook Setup Guide](docs/git-hook-setup.md)** for complete installa
 ### 👨‍💻 For Developers
 - **[API Reference](docs/api-reference.md)** - Complete MCP tool documentation with examples
 - **[Architecture Overview](docs/architecture.md)** - Technical deep dive into system design
+- **[Database Resilience Guide](docs/database-resilience.md)** - Advanced database optimization and monitoring
+
+### 🔧 For System Administrators
+- **[Performance Tuning Guide](docs/performance-tuning.md)** - High-concurrency deployment optimization
+- **[Monitoring & Diagnostics](docs/monitoring.md)** - Production monitoring setup and troubleshooting
 
 ### 🤝 For Contributors
 - **[Contributing Guide](docs/contributing.md)** - Development setup and workflow guidelines
@@ -321,6 +334,8 @@ Tested with codebases up to **10,000 files**:
 
 ## 🔧 Advanced Configuration
 
+### 👨‍💻 For Developers: Basic Configuration
+
 ```bash
 # Production setup with custom limits
 mcp-code-indexer \
@@ -334,6 +349,44 @@ export MCP_LOG_FORMAT=json
 mcp-code-indexer
 ```
 
+### 🔧 For System Administrators: Database Resilience Tuning
+
+Configure advanced database resilience features for high-concurrency environments:
+
+```bash
+# High-performance production deployment
+mcp-code-indexer \
+  --token-limit 64000 \
+  --db-path /data/mcp-index.db \
+  --cache-dir /var/cache/mcp \
+  --log-level INFO \
+  --db-pool-size 5 \
+  --db-retry-count 7 \
+  --db-timeout 15.0 \
+  --enable-wal-mode \
+  --health-check-interval 20.0
+
+# Environment variable configuration
+export DB_POOL_SIZE=5
+export DB_RETRY_COUNT=7
+export DB_TIMEOUT=15.0
+export DB_WAL_MODE=true
+export DB_HEALTH_CHECK_INTERVAL=20.0
+mcp-code-indexer --token-limit 64000
+```
+
+#### Configuration Options
+
+| Parameter | Default | Description | Use Case |
+|-----------|---------|-------------|----------|
+| `--db-pool-size` | 3 | Database connection pool size | Higher for more concurrent clients |
+| `--db-retry-count` | 5 | Max retry attempts for failed operations | Increase for unstable environments |
+| `--db-timeout` | 10.0 | Transaction timeout (seconds) | Increase for large operations |
+| `--enable-wal-mode` | true | Enable WAL mode for concurrency | Always enable for production |
+| `--health-check-interval` | 30.0 | Health monitoring interval (seconds) | Lower for faster issue detection |
+
+💡 **Performance Tip**: For environments with 10+ concurrent clients, use `--db-pool-size 5` and `--health-check-interval 15.0` for optimal throughput.
+
 ## 🤝 Integration Examples
 
 ### With AI Agents
|