mcp-code-indexer 2.0.2__py3-none-any.whl → 2.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,303 @@
+"""
+Custom exception hierarchy for SQLite errors with retry classification.
+
+This module provides structured error handling for database operations,
+with specific exceptions for different types of SQLite errors and
+comprehensive error context for monitoring and debugging.
+"""
+
+from datetime import datetime, timezone
+from typing import Any, Dict, Optional
+
+
+class DatabaseError(Exception):
+    """Base exception for all database-related errors."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 error_context: Optional[Dict[str, Any]] = None):
+        self.message = message
+        self.operation_name = operation_name
+        self.error_context = error_context or {}
+        self.timestamp = datetime.now(timezone.utc)
+        super().__init__(f"{operation_name}: {message}" if operation_name else message)
+
+    def to_dict(self) -> Dict[str, Any]:
+        """Convert exception to dictionary for structured logging."""
+        return {
+            "error_type": self.__class__.__name__,
+            "message": self.message,
+            "operation_name": self.operation_name,
+            "timestamp": self.timestamp.isoformat(),
+            "error_context": self.error_context
+        }
+
+
+class DatabaseLockError(DatabaseError):
+    """Exception for SQLite database locking issues that are retryable."""
+
+    def __init__(self, message: str, retry_count: int = 0, operation_name: str = "",
+                 last_attempt: Optional[datetime] = None, lock_type: str = "unknown"):
+        self.retry_count = retry_count
+        self.last_attempt = last_attempt or datetime.now(timezone.utc)
+        self.lock_type = lock_type  # 'read', 'write', 'exclusive'
+
+        error_context = {
+            "retry_count": retry_count,
+            "last_attempt": self.last_attempt.isoformat(),
+            "lock_type": lock_type,
+            "retryable": True
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+class DatabaseBusyError(DatabaseError):
+    """Exception for SQLite database busy errors that are retryable."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 busy_timeout: float = 0.0, resource_type: str = "connection"):
+        self.busy_timeout = busy_timeout
+        self.resource_type = resource_type  # 'connection', 'transaction', 'table'
+
+        error_context = {
+            "busy_timeout": busy_timeout,
+            "resource_type": resource_type,
+            "retryable": True
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+class DatabaseConnectionError(DatabaseError):
+    """Exception for database connection issues."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 connection_info: Optional[Dict[str, Any]] = None):
+        self.connection_info = connection_info or {}
+
+        error_context = {
+            "connection_info": self.connection_info,
+            "retryable": False  # Connection errors usually indicate config issues
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+class DatabaseSchemaError(DatabaseError):
+    """Exception for database schema-related errors."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 schema_version: Optional[str] = None, migration_info: Optional[Dict] = None):
+        self.schema_version = schema_version
+        self.migration_info = migration_info or {}
+
+        error_context = {
+            "schema_version": schema_version,
+            "migration_info": self.migration_info,
+            "retryable": False  # Schema errors require manual intervention
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+class DatabaseIntegrityError(DatabaseError):
+    """Exception for database integrity constraint violations."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 constraint_type: str = "unknown", affected_table: str = ""):
+        self.constraint_type = constraint_type  # 'primary_key', 'foreign_key', 'unique', 'check'
+        self.affected_table = affected_table
+
+        error_context = {
+            "constraint_type": constraint_type,
+            "affected_table": affected_table,
+            "retryable": False  # Integrity errors indicate data issues
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+class DatabaseTimeoutError(DatabaseError):
+    """Exception for database operation timeouts."""
+
+    def __init__(self, message: str, operation_name: str = "",
+                 timeout_seconds: float = 0.0, operation_type: str = "unknown"):
+        self.timeout_seconds = timeout_seconds
+        self.operation_type = operation_type  # 'read', 'write', 'transaction'
+
+        error_context = {
+            "timeout_seconds": timeout_seconds,
+            "operation_type": operation_type,
+            "retryable": True  # Timeouts might be transient
+        }
+
+        super().__init__(message, operation_name, error_context)
+
+
+def classify_sqlite_error(error: Exception, operation_name: str = "") -> DatabaseError:
+    """
+    Classify a raw SQLite error into our structured exception hierarchy.
+
+    Args:
+        error: Original exception from SQLite
+        operation_name: Name of the operation that failed
+
+    Returns:
+        Appropriate DatabaseError subclass with context
+    """
+    error_message = str(error).lower()
+    original_message = str(error)
+
+    # Database locking errors
+    if any(msg in error_message for msg in [
+        "database is locked",
+        "sqlite_locked",
+        "attempt to write a readonly database"
+    ]):
+        lock_type = "write" if "write" in error_message or "readonly" in error_message else "read"
+        return DatabaseLockError(
+            original_message,
+            operation_name=operation_name,
+            lock_type=lock_type
+        )
+
+    # Database busy errors
+    if any(msg in error_message for msg in [
+        "database is busy",
+        "sqlite_busy",
+        "cannot start a transaction within a transaction"
+    ]):
+        resource_type = "transaction" if "transaction" in error_message else "connection"
+        return DatabaseBusyError(
+            original_message,
+            operation_name=operation_name,
+            resource_type=resource_type
+        )
+
+    # Connection errors
+    if any(msg in error_message for msg in [
+        "unable to open database",
+        "disk i/o error",
+        "database disk image is malformed",
+        "no such database"
+    ]):
+        return DatabaseConnectionError(
+            original_message,
+            operation_name=operation_name
+        )
+
+    # Schema errors
+    if any(msg in error_message for msg in [
+        "no such table",
+        "no such column",
+        "table already exists",
+        "syntax error"
+    ]):
+        return DatabaseSchemaError(
+            original_message,
+            operation_name=operation_name
+        )
+
+    # Integrity constraint errors
+    if any(msg in error_message for msg in [
+        "unique constraint failed",
+        "foreign key constraint failed",
+        "primary key constraint failed",
+        "check constraint failed"
+    ]):
+        constraint_type = "unknown"
+        if "unique" in error_message:
+            constraint_type = "unique"
+        elif "foreign key" in error_message:
+            constraint_type = "foreign_key"
+        elif "primary key" in error_message:
+            constraint_type = "primary_key"
+        elif "check" in error_message:
+            constraint_type = "check"
+
+        return DatabaseIntegrityError(
+            original_message,
+            operation_name=operation_name,
+            constraint_type=constraint_type
+        )
+
+    # Default to generic database error
+    return DatabaseError(
+        original_message,
+        operation_name=operation_name,
+        error_context={"original_error_type": type(error).__name__}
+    )
+
+
+def is_retryable_error(error: Exception) -> bool:
+    """
+    Determine if an error is retryable based on our classification.
+
+    Args:
+        error: Exception to check
+
+    Returns:
+        True if the error should trigger a retry
+    """
+    if isinstance(error, DatabaseError):
+        return error.error_context.get("retryable", False)
+
+    # For raw exceptions, use simple classification
+    error_message = str(error).lower()
+    retryable_patterns = [
+        "database is locked",
+        "database is busy",
+        "sqlite_busy",
+        "sqlite_locked",
+        "cannot start a transaction within a transaction"
+    ]
+
+    return any(pattern in error_message for pattern in retryable_patterns)
+
+
+def get_error_classification_stats(errors: list) -> Dict[str, Any]:
+    """
+    Analyze a list of errors and provide classification statistics.
+
+    Args:
+        errors: List of Exception objects to analyze
+
+    Returns:
+        Dictionary with error classification statistics
+    """
+    stats = {
+        "total_errors": len(errors),
+        "error_types": {},
+        "retryable_count": 0,
+        "non_retryable_count": 0,
+        "most_common_errors": []  # filled below with (message, count) pairs
+    }
+
+    error_messages = {}
+
+    for error in errors:
+        # Classify error
+        classified = classify_sqlite_error(error) if not isinstance(error, DatabaseError) else error
+        error_type = type(classified).__name__
+
+        # Count by type
+        stats["error_types"][error_type] = stats["error_types"].get(error_type, 0) + 1
+
+        # Count retryable vs non-retryable
+        if is_retryable_error(classified):
+            stats["retryable_count"] += 1
+        else:
+            stats["non_retryable_count"] += 1
+
+        # Track common error messages
+        message = str(error)
+        error_messages[message] = error_messages.get(message, 0) + 1
+
+    # Find the five most common error messages
+    stats["most_common_errors"] = sorted(
+        error_messages.items(),
+        key=lambda x: x[1],
+        reverse=True
+    )[:5]
+
+    return stats
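
A minimal usage sketch for the exception module above. The import path `mcp_code_indexer.database.exceptions` is an assumption for illustration, and the error strings mirror SQLite's usual wording:

    import sqlite3

    # Hypothetical import path for the module shown in this diff
    from mcp_code_indexer.database.exceptions import (
        classify_sqlite_error,
        get_error_classification_stats,
        is_retryable_error,
    )

    errors = [
        sqlite3.OperationalError("database is locked"),
        sqlite3.IntegrityError("UNIQUE constraint failed: files.path"),
    ]

    for err in errors:
        classified = classify_sqlite_error(err, operation_name="upsert_file")
        # Prints: DatabaseLockError True, then DatabaseIntegrityError False
        print(type(classified).__name__, is_retryable_error(classified))

    # Aggregate counts for monitoring, e.g. retryable vs. non-retryable
    print(get_error_classification_stats(errors))
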
@@ -0,0 +1,359 @@
+"""
+Tenacity-based retry executor for database operations with exponential backoff.
+
+This module provides a robust retry executor that replaces the broken async
+context manager retry pattern with proper separation of concerns between
+retry logic and resource management.
+"""
+
+import logging
+from contextlib import asynccontextmanager
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from typing import (
+    Any,
+    AsyncContextManager,
+    AsyncIterator,
+    Awaitable,
+    Callable,
+    Dict,
+    Optional,
+    TypeVar,
+)
+
+import aiosqlite
+from tenacity import (
+    AsyncRetrying,
+    RetryError,
+    stop_after_attempt,
+    wait_exponential_jitter,
+    before_sleep_log,
+    after_log
+)
+
+logger = logging.getLogger(__name__)
+
+T = TypeVar('T')
+
+
+@dataclass
+class RetryConfig:
+    """Configuration for database retry logic using tenacity."""
+    max_attempts: int = 5
+    min_wait_seconds: float = 0.1
+    max_wait_seconds: float = 2.0
+    jitter_max_seconds: float = 0.2  # Max jitter to add
+    retry_on_errors: tuple = field(default_factory=lambda: (aiosqlite.OperationalError,))
+
+
+@dataclass
+class RetryStats:
+    """Statistics for retry operations."""
+    total_operations: int = 0
+    successful_operations: int = 0
+    retried_operations: int = 0
+    failed_operations: int = 0
+    total_attempts: int = 0
+    total_retry_time: float = 0.0
+    last_operation_time: Optional[datetime] = None
+
+    @property
+    def success_rate(self) -> float:
+        """Calculate success rate as a percentage."""
+        if self.total_operations == 0:
+            return 0.0
+        return (self.successful_operations / self.total_operations) * 100.0
+
+    @property
+    def retry_rate(self) -> float:
+        """Calculate retry rate as a percentage."""
+        if self.total_operations == 0:
+            return 0.0
+        return (self.retried_operations / self.total_operations) * 100.0
+
+    @property
+    def average_attempts_per_operation(self) -> float:
+        """Calculate average attempts (including the first) per operation."""
+        if self.total_operations == 0:
+            return 0.0
+        return self.total_attempts / self.total_operations
+
+
+class DatabaseLockError(Exception):
+    """Exception for database locking issues with retry context."""
+
+    def __init__(self, message: str, retry_count: int = 0, operation_name: str = "",
+                 last_attempt: Optional[datetime] = None):
+        self.message = message
+        self.retry_count = retry_count
+        self.operation_name = operation_name
+        self.last_attempt = last_attempt or datetime.now(timezone.utc)
+        super().__init__(f"{operation_name}: {message} (after {retry_count} attempts)")
+
+
+class RetryExecutor:
+    """
+    Tenacity-based retry executor for database operations.
+
+    This executor provides robust retry logic with exponential backoff,
+    proper error classification, and comprehensive statistics tracking.
+    It replaces the broken async context manager retry pattern.
+    """
+
+    def __init__(self, config: Optional[RetryConfig] = None):
+        """
+        Initialize retry executor.
+
+        Args:
+            config: Retry configuration, uses defaults if None
+        """
+        self.config = config or RetryConfig()
+        self._stats = RetryStats()
+        self._operation_start_times: Dict[str, datetime] = {}
+
+        # Configure tenacity retrying with exponential backoff and jitter
+        self._tenacity_retrying = AsyncRetrying(
+            stop=stop_after_attempt(self.config.max_attempts),
+            wait=wait_exponential_jitter(
+                initial=self.config.min_wait_seconds,
+                max=self.config.max_wait_seconds,
+                jitter=self.config.jitter_max_seconds
+            ),
+            retry=self._should_retry_exception,
+            before_sleep=before_sleep_log(logger, logging.WARNING),
+            after=after_log(logger, logging.DEBUG),
+            reraise=False
+        )
+
+    async def execute_with_retry(self,
+                                 operation: Callable[[], Awaitable[T]],
+                                 operation_name: str = "database_operation") -> T:
+        """
+        Execute an operation with retry logic.
+
+        Args:
+            operation: Async callable to execute
+            operation_name: Name for logging and statistics
+
+        Returns:
+            Result of the operation
+
+        Raises:
+            DatabaseLockError: If all retry attempts fail
+            Exception: For non-retryable errors
+        """
+        self._stats.total_operations += 1
+        self._operation_start_times[operation_name] = datetime.now(timezone.utc)
+
+        attempt_count = 0
+        operation_start = datetime.now(timezone.utc)
+
+        try:
+            async for attempt in self._tenacity_retrying:
+                with attempt:
+                    attempt_count += 1
+                    self._stats.total_attempts += 1
+
+                    # Execute the operation
+                    result = await operation()
+
+                    # Success - update statistics
+                    operation_time = (datetime.now(timezone.utc) - operation_start).total_seconds()
+                    self._stats.successful_operations += 1
+                    self._stats.last_operation_time = datetime.now(timezone.utc)
+
+                    if attempt_count > 1:
+                        self._stats.retried_operations += 1
+                        self._stats.total_retry_time += operation_time
+                        logger.info(
+                            f"Operation '{operation_name}' succeeded after {attempt_count} attempts",
+                            extra={"structured_data": {
+                                "retry_success": {
+                                    "operation": operation_name,
+                                    "attempts": attempt_count,
+                                    "total_time_seconds": operation_time
+                                }
+                            }}
+                        )
+
+                    return result
+
+        except RetryError as e:
+            # All retry attempts exhausted
+            operation_time = (datetime.now(timezone.utc) - operation_start).total_seconds()
+            self._stats.failed_operations += 1
+            self._stats.total_retry_time += operation_time
+
+            original_error = e.last_attempt.exception()
+            logger.error(
+                f"Operation '{operation_name}' failed after {attempt_count} attempts",
+                extra={"structured_data": {
+                    "retry_exhausted": {
+                        "operation": operation_name,
+                        "max_attempts": self.config.max_attempts,
+                        "total_time_seconds": operation_time,
+                        "final_error": str(original_error)
+                    }
+                }}
+            )
+
+            raise DatabaseLockError(
+                f"Database operation failed after {attempt_count} attempts: {original_error}",
+                retry_count=attempt_count,
+                operation_name=operation_name,
+                last_attempt=datetime.now(timezone.utc)
+            )
+
+        except Exception as e:
+            # Non-retryable error, classified by _should_retry_exception and
+            # re-raised unchanged
+            self._stats.failed_operations += 1
+            logger.error(
+                f"Non-retryable error in '{operation_name}': {e}",
+                extra={"structured_data": {
+                    "immediate_failure": {
+                        "operation": operation_name,
+                        "error_type": type(e).__name__,
+                        "error_message": str(e)
+                    }
+                }}
+            )
+            raise
+
+        finally:
+            # Clean up tracking
+            self._operation_start_times.pop(operation_name, None)
+
+    @asynccontextmanager
+    async def get_connection_with_retry(self,
+                                        connection_factory: Callable[[], AsyncContextManager[aiosqlite.Connection]],
+                                        operation_name: str = "database_connection") -> AsyncIterator[aiosqlite.Connection]:
+        """
+        Get a database connection with retry logic wrapped around acquisition.
+
+        This method separates retry logic from resource management: only
+        connection acquisition is retried, and the factory's context manager
+        is held open until the caller is finished with the connection.
+
+        Args:
+            connection_factory: Function returning an async context manager that yields a connection
+            operation_name: Name for logging and statistics
+
+        Yields:
+            Database connection
+        """
+
+        async def open_connection():
+            # Enter the factory's context manager but do not exit it here;
+            # exiting now would close the connection before it is yielded
+            manager = connection_factory()
+            connection = await manager.__aenter__()
+            return manager, connection
+
+        # Retry only the acquisition; work done with the connection is not retried
+        manager, connection = await self.execute_with_retry(open_connection, operation_name)
+
+        try:
+            yield connection
+        finally:
+            # Release the connection by exiting the factory's context manager
+            await manager.__aexit__(None, None, None)
+
+    def _should_retry_exception(self, retry_state) -> bool:
+        """
+        Determine if an exception should trigger a retry.
+
+        This is used by tenacity to decide whether to retry.
+
+        Args:
+            retry_state: Tenacity retry state
+
+        Returns:
+            True if the exception should trigger a retry
+        """
+        if retry_state.outcome is None:
+            return False
+
+        exception = retry_state.outcome.exception()
+        if exception is None:
+            return False
+
+        return self._is_sqlite_retryable_error(exception)
+
+    def _is_sqlite_retryable_error(self, error: Exception) -> bool:
+        """
+        Determine if a SQLite error is retryable.
+
+        Args:
+            error: Exception to check
+
+        Returns:
+            True if the error should trigger a retry
+        """
+        if not isinstance(error, self.config.retry_on_errors):
+            return False
+
+        # Check specific SQLite error messages that indicate transient issues
+        error_message = str(error).lower()
+        retryable_messages = [
+            "database is locked",
+            "database is busy",
+            "cannot start a transaction within a transaction",
+            "sqlite_busy",
+            "sqlite_locked"
+        ]
+
+        return any(msg in error_message for msg in retryable_messages)
+
+    def get_retry_stats(self) -> Dict[str, Any]:
+        """
+        Get comprehensive retry statistics.
+
+        Returns:
+            Dictionary with retry statistics and performance metrics
+        """
+        return {
+            "total_operations": self._stats.total_operations,
+            "successful_operations": self._stats.successful_operations,
+            "retried_operations": self._stats.retried_operations,
+            "failed_operations": self._stats.failed_operations,
+            "total_attempts": self._stats.total_attempts,
+            "success_rate_percent": round(self._stats.success_rate, 2),
+            "retry_rate_percent": round(self._stats.retry_rate, 2),
+            "average_attempts_per_operation": round(self._stats.average_attempts_per_operation, 2),
+            "total_retry_time_seconds": round(self._stats.total_retry_time, 3),
+            "last_operation_time": self._stats.last_operation_time.isoformat() if self._stats.last_operation_time else None,
+            "config": {
+                "max_attempts": self.config.max_attempts,
+                "min_wait_seconds": self.config.min_wait_seconds,
+                "max_wait_seconds": self.config.max_wait_seconds,
+                "jitter_max_seconds": self.config.jitter_max_seconds
+            }
+        }
+
+    def reset_stats(self) -> None:
+        """Reset retry statistics."""
+        self._stats = RetryStats()
+        self._operation_start_times.clear()
+
+
+def create_retry_executor(
+    max_attempts: int = 5,
+    min_wait_seconds: float = 0.1,
+    max_wait_seconds: float = 2.0,
+    jitter_max_seconds: float = 0.2
+) -> RetryExecutor:
+    """
+    Create a configured retry executor for database operations.
+
+    Args:
+        max_attempts: Maximum retry attempts
+        min_wait_seconds: Initial delay in seconds
+        max_wait_seconds: Maximum delay in seconds
+        jitter_max_seconds: Maximum jitter to add to delays
+
+    Returns:
+        Configured RetryExecutor instance
+    """
+    config = RetryConfig(
+        max_attempts=max_attempts,
+        min_wait_seconds=min_wait_seconds,
+        max_wait_seconds=max_wait_seconds,
+        jitter_max_seconds=jitter_max_seconds
+    )
+    return RetryExecutor(config)
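
A usage sketch for the retry executor, assuming an aiosqlite database file named `example.db` (the path and queries are illustrative):

    import asyncio

    import aiosqlite

    async def main() -> None:
        executor = create_retry_executor(max_attempts=3)

        async def count_tables() -> int:
            # Zero-argument async callable, as execute_with_retry expects
            async with aiosqlite.connect("example.db") as conn:
                cursor = await conn.execute("SELECT COUNT(*) FROM sqlite_master")
                row = await cursor.fetchone()
                return row[0]

        # Retried automatically on transient "database is locked"/"busy" errors
        count = await executor.execute_with_retry(count_tables, "count_tables")
        print(count, executor.get_retry_stats()["retry_rate_percent"])

        # Acquisition-only retry: the connection remains open inside the block
        async with executor.get_connection_with_retry(
            lambda: aiosqlite.connect("example.db"), "open_db"
        ) as conn:
            await conn.execute("PRAGMA user_version")

    asyncio.run(main())

Note that `get_connection_with_retry` retries only acquiring the connection; once it has been yielded, work performed with it is not retried.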