PyPI - mcp-code-indexer - Versions diffs - 3.1.4__py3-none-any.whl → 3.1.5__py3-none-any.whl - Mend

mcp-code-indexer 3.1.4 py3-none-any.whl → 3.1.5 py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

mcp_code_indexer/__init__.py +8 -6
mcp_code_indexer/ask_handler.py +105 -75
mcp_code_indexer/claude_api_handler.py +125 -82
mcp_code_indexer/cleanup_manager.py +107 -81
mcp_code_indexer/database/connection_health.py +212 -161
mcp_code_indexer/database/database.py +529 -415
mcp_code_indexer/database/exceptions.py +167 -118
mcp_code_indexer/database/models.py +54 -19
mcp_code_indexer/database/retry_executor.py +139 -103
mcp_code_indexer/deepask_handler.py +178 -140
mcp_code_indexer/error_handler.py +88 -76
mcp_code_indexer/file_scanner.py +163 -141
mcp_code_indexer/git_hook_handler.py +352 -261
mcp_code_indexer/logging_config.py +76 -94
mcp_code_indexer/main.py +406 -320
mcp_code_indexer/middleware/error_middleware.py +106 -71
mcp_code_indexer/query_preprocessor.py +40 -40
mcp_code_indexer/server/mcp_server.py +785 -470
mcp_code_indexer/token_counter.py +54 -47
{mcp_code_indexer-3.1.4.dist-info → mcp_code_indexer-3.1.5.dist-info}/METADATA +3 -3
mcp_code_indexer-3.1.5.dist-info/RECORD +37 -0
mcp_code_indexer-3.1.4.dist-info/RECORD +0 -37
{mcp_code_indexer-3.1.4.dist-info → mcp_code_indexer-3.1.5.dist-info}/WHEEL +0 -0
{mcp_code_indexer-3.1.4.dist-info → mcp_code_indexer-3.1.5.dist-info}/entry_points.txt +0 -0
{mcp_code_indexer-3.1.4.dist-info → mcp_code_indexer-3.1.5.dist-info}/licenses/LICENSE +0 -0
{mcp_code_indexer-3.1.4.dist-info → mcp_code_indexer-3.1.5.dist-info}/top_level.txt +0 -0

mcp_code_indexer/git_hook_handler.py CHANGED Viewed

@@ -11,48 +11,57 @@ import json
 import logging
 import os
 import subprocess
-import tempfile
 from pathlib import Path
 from typing import Dict, List, Optional, Tuple, Any
 import aiohttp
-from tenacity import retry, wait_exponential, stop_after_attempt, retry_if_exception_type
+from tenacity import (
+    retry,
+    wait_exponential,
+    stop_after_attempt,
+    retry_if_exception_type,
+)
 from .database.database import DatabaseManager
-from .database.models import Project, FileDescription
-from .error_handler import ValidationError
 from .token_counter import TokenCounter
 class GitHookError(Exception):
     """Custom exception for git hook operations."""
     pass
 class ThrottlingError(Exception):
     """Exception for rate limiting scenarios."""
     pass
 class GitHookHandler:
     """
     Handles git hook integration for automated code indexing.
     This class provides functionality to:
     - Analyze git diffs to identify changed files
     - Use OpenRouter API to update file descriptions
     - Update project overview when structural changes occur
     """
     # OpenRouter configuration
     OPENROUTER_API_URL = "https://openrouter.ai/api/v1/chat/completions"
     OPENROUTER_MODEL = "anthropic/claude-sonnet-4"
-    def __init__(self, db_manager: DatabaseManager, cache_dir: Path, logger: Optional[logging.Logger] = None):
+    def __init__(
+        self,
+        db_manager: DatabaseManager,
+        cache_dir: Path,
+        logger: Optional[logging.Logger] = None,
+    ):
         """
         Initialize GitHookHandler.
         Args:
             db_manager: Database manager instance
             cache_dir: Cache directory for temporary files
@@ -62,7 +71,7 @@ class GitHookHandler:
         self.cache_dir = cache_dir
         self.logger = logger if logger is not None else logging.getLogger(__name__)
         self.token_counter = TokenCounter()
         # Git hook specific settings
         self.config = {
             "model": os.getenv("MCP_GITHOOK_MODEL", self.OPENROUTER_MODEL),
@@ -70,123 +79,154 @@ class GitHookHandler:
             "timeout": 300,  # 5 minutes
             "temperature": 0.3,  # Lower temperature for consistent updates
         }
         # Validate OpenRouter API key
         self.api_key = os.getenv("OPENROUTER_API_KEY")
         if not self.api_key:
-            raise GitHookError("OPENROUTER_API_KEY environment variable is required for git hook mode")
+            raise GitHookError(
+                "OPENROUTER_API_KEY environment variable is required for git hook mode"
+            )
     async def run_githook_mode(
-        self,
-        commit_hash: Optional[str] = None,
-        commit_range: Optional[Tuple[str, str]] = None
+        self,
+        commit_hash: Optional[str] = None,
+        commit_range: Optional[Tuple[str, str]] = None,
     ) -> None:
         """
         Run in git hook mode - analyze changes and update descriptions.
         Args:
             commit_hash: Process a specific commit by hash
             commit_range: Process commits in range (start_hash, end_hash)
         This is the main entry point for git hook functionality.
         """
         try:
-            self.logger.info(f"=== Git Hook Analysis Started ===")
+            self.logger.info("=== Git Hook Analysis Started ===")
             if commit_hash:
                 self.logger.info(f"Mode: Single commit ({commit_hash})")
             elif commit_range:
-                self.logger.info(f"Mode: Commit range ({commit_range[0]}..{commit_range[1]})")
+                self.logger.info(
+                    f"Mode: Commit range ({commit_range[0]}..{commit_range[1]})"
+                )
             else:
-                self.logger.info(f"Mode: Staged changes")
+                self.logger.info("Mode: Staged changes")
             # Get git info from current directory
             project_info = await self._identify_project_from_git()
-            self.logger.info(f"Project identified: {project_info.get('name', 'Unknown')} at {project_info.get('folderPath', 'Unknown')}")
+            self.logger.info(
+                f"Project identified: {project_info.get('name', 'Unknown')} "
+                f"at {project_info.get('folderPath', 'Unknown')}"
+            )
             # Get git diff and commit message based on mode
             if commit_hash:
                 git_diff = await self._get_git_diff_for_commit(commit_hash)
                 commit_message = await self._get_commit_message_for_commit(commit_hash)
             elif commit_range:
-                git_diff = await self._get_git_diff_for_range(commit_range[0], commit_range[1])
-                commit_message = await self._get_commit_messages_for_range(commit_range[0], commit_range[1])
+                git_diff = await self._get_git_diff_for_range(
+                    commit_range[0], commit_range[1]
+                )
+                commit_message = await self._get_commit_messages_for_range(
+                    commit_range[0], commit_range[1]
+                )
             else:
                 git_diff = await self._get_git_diff()
                 commit_message = await self._get_commit_message()
             # Log diff details
             if not git_diff:
-                self.logger.info(f"Skipping git hook update - no git diff")
+                self.logger.info("Skipping git hook update - no git diff")
                 return
             diff_tokens = self.token_counter.count_tokens(git_diff)
             self.logger.info(f"Git diff: {diff_tokens} tokens")
             # Fetch current state
             self.logger.info("Fetching current project state...")
             current_overview = await self._get_project_overview(project_info)
             current_descriptions = await self._get_all_descriptions(project_info)
             changed_files = self._extract_changed_files(git_diff)
             if not changed_files:
                 self.logger.info("No changed files detected in git diff")
                 return
-            self.logger.info(f"Found {len(changed_files)} changed files: {', '.join(changed_files)}")
-            overview_tokens = self.token_counter.count_tokens(current_overview) if current_overview else 0
+            self.logger.info(
+                f"Found {len(changed_files)} changed files: {', '.join(changed_files)}"
+            )
+            overview_tokens = (
+                self.token_counter.count_tokens(current_overview)
+                if current_overview
+                else 0
+            )
             self.logger.info(f"Current overview: {overview_tokens} tokens")
             self.logger.info(f"Current descriptions count: {len(current_descriptions)}")
             # Try single-stage first, fall back to two-stage if needed
             updates = await self._analyze_with_smart_staging(
-                git_diff, commit_message, current_overview, current_descriptions, changed_files
+                git_diff,
+                commit_message,
+                current_overview,
+                current_descriptions,
+                changed_files,
             )
             # Apply updates to database
             await self._apply_updates(project_info, updates)
-            self.logger.info(f"Git hook update completed successfully for {len(changed_files)} files")
+            self.logger.info(
+                f"Git hook update completed successfully for {len(changed_files)} files"
+            )
         except Exception as e:
             self.logger.error(f"Git hook mode failed: {e}")
             self.logger.error(f"Exception details: {type(e).__name__}: {str(e)}")
             import traceback
             self.logger.error(f"Full traceback:\n{traceback.format_exc()}")
             # Don't fail the git operation - just log the error
             raise GitHookError(f"Git hook processing failed: {e}")
     async def _analyze_with_smart_staging(
         self,
         git_diff: str,
         commit_message: str,
         current_overview: str,
         current_descriptions: Dict[str, str],
-        changed_files: List[str]
+        changed_files: List[str],
     ) -> Dict[str, Any]:
         """
-        Smart staging: Try single-stage first, fall back to two-stage if token limit exceeded.
+        Smart staging: Try single-stage first, fall back to two-stage if
+        token limit exceeded.
         Args:
             git_diff: Git diff content
             commit_message: Commit message explaining the changes
             current_overview: Current project overview
             current_descriptions: Current file descriptions
             changed_files: List of changed file paths
         Returns:
             Dict containing file_updates and overview_update
         """
         # Build single-stage prompt and check token count
         single_stage_prompt = self._build_single_stage_prompt(
-            git_diff, commit_message, current_overview, current_descriptions, changed_files
+            git_diff,
+            commit_message,
+            current_overview,
+            current_descriptions,
+            changed_files,
         )
         prompt_tokens = self.token_counter.count_tokens(single_stage_prompt)
-        token_limit = self.config.get("max_diff_tokens", 130000)  # Conservative limit under 136k
+        token_limit = self.config.get(
+            "max_diff_tokens", 130000
+        )  # Conservative limit under 136k
         self.logger.info(f"Single-stage prompt: {prompt_tokens} tokens")
         self.logger.info(f"Token limit: {token_limit}")
         if prompt_tokens <= token_limit:
             # Use single-stage approach
             self.logger.info("Using single-stage analysis (within token limit)")
@@ -195,55 +235,60 @@ class GitHookHandler:
             return result
         else:
             # Fall back to two-stage approach
-            self.logger.info(f"Single-stage prompt too large ({prompt_tokens} tokens), falling back to two-stage analysis")
+            self.logger.info(
+                f"Single-stage prompt too large ({prompt_tokens} tokens), "
+                f"falling back to two-stage analysis"
+            )
             # Stage 1: Check if overview needs updating
             overview_updates = await self._analyze_overview_updates(
                 git_diff, commit_message, current_overview, changed_files
             )
-            # Stage 2: Update file descriptions
+            # Stage 2: Update file descriptions
             file_updates = await self._analyze_file_updates(
                 git_diff, commit_message, current_descriptions, changed_files
             )
             # Combine updates
             updates = {
                 "file_updates": file_updates.get("file_updates", {}),
-                "overview_update": overview_updates.get("overview_update")
+                "overview_update": overview_updates.get("overview_update"),
             }
             self.logger.info("Two-stage analysis completed")
             return updates
     def _build_single_stage_prompt(
         self,
         git_diff: str,
         commit_message: str,
         current_overview: str,
         current_descriptions: Dict[str, str],
-        changed_files: List[str]
+        changed_files: List[str],
     ) -> str:
         """
         Build single-stage prompt that handles both overview and file updates.
         Args:
             git_diff: Git diff content
             commit_message: Commit message explaining the changes
             current_overview: Current project overview
             current_descriptions: Current file descriptions
             changed_files: List of changed file paths
         Returns:
             Complete single-stage prompt
         """
         # Only include descriptions for changed files to reduce token usage
         relevant_descriptions = {
-            path: desc for path, desc in current_descriptions.items()
+            path: desc
+            for path, desc in current_descriptions.items()
             if path in changed_files
         }
-        return f"""Analyze this git commit and update both the project overview (if needed) and file descriptions.
+        return f"""Analyze this git commit and update both the project overview
+(if needed) and file descriptions.
 COMMIT MESSAGE:
 {commit_message or "No commit message available"}
@@ -262,18 +307,24 @@ GIT DIFF:
 INSTRUCTIONS:
-1. OVERVIEW UPDATE: Update project overview ONLY if there are major structural changes like:
-   - New major features or components (indicated by commit message or new directories)
+1. OVERVIEW UPDATE: Update project overview ONLY if there are major
+   structural changes like:
+   - New major features or components (indicated by commit message or new
+     directories)
    - Architectural changes (new patterns, frameworks, or approaches)
-   - Significant dependency additions (Cargo.toml, package.json, requirements.txt changes)
+   - Significant dependency additions (Cargo.toml, package.json,
+     requirements.txt changes)
    - New API endpoints or workflows
    - Changes to build/deployment processes
    Do NOT update for: bug fixes, small refactors, documentation updates, version bumps.
-   If updating, provide comprehensive narrative (10-20 pages of text) with directory structure, architecture, components, and workflows.
-2. FILE UPDATES: Update descriptions for files that have changed significantly. Consider both the diff content and commit message context. Only include files that need actual description updates.
+   If updating, provide comprehensive narrative (10-20 pages of text) with
+   directory structure, architecture, components, and workflows.
+2. FILE UPDATES: Update descriptions for files that have changed
+   significantly. Consider both the diff content and commit message context.
+   Only include files that need actual description updates.
 Return ONLY a JSON object:
 {{
@@ -283,51 +334,46 @@ Return ONLY a JSON object:
     "path/to/file2.js": "Updated description for file2"
   }}
 }}"""
     async def _identify_project_from_git(self) -> Dict[str, Any]:
         """
         Identify project information from git repository.
         Returns:
             Dict containing project identification info
         """
         try:
             # Get current working directory as project root
             project_root = Path.cwd()
             # Use directory name as project name
             project_name = project_root.name
-            return {
-                "projectName": project_name,
-                "folderPath": str(project_root)
-            }
+            return {"projectName": project_name, "folderPath": str(project_root)}
         except Exception as e:
             raise GitHookError(f"Failed to identify project from git: {e}")
     async def _get_git_diff(self) -> str:
         """
         Get git diff for recent changes.
         Returns:
             Git diff content as string
         """
         try:
             # Get diff from last commit
-            diff_result = await self._run_git_command([
-                "diff", "--no-color", "--no-ext-diff", "HEAD~1..HEAD"
-            ])
+            diff_result = await self._run_git_command(
+                ["diff", "--no-color", "--no-ext-diff", "HEAD~1..HEAD"]
+            )
             return diff_result
         except subprocess.CalledProcessError:
             # If HEAD~1 doesn't exist (first commit), get diff against empty tree
             try:
-                diff_result = await self._run_git_command([
-                    "diff", "--no-color", "--no-ext-diff", "--cached"
-                ])
+                diff_result = await self._run_git_command(
+                    ["diff", "--no-color", "--no-ext-diff", "--cached"]
+                )
                 return diff_result
             except subprocess.CalledProcessError as e:
                 raise GitHookError(f"Failed to get git diff: {e}")
@@ -335,17 +381,15 @@ Return ONLY a JSON object:
     async def _get_commit_message(self) -> str:
         """
         Get the commit message for context about what was changed.
         Returns:
             Commit message as string
         """
         try:
             # Get the commit message from the latest commit
-            message_result = await self._run_git_command([
-                "log", "-1", "--pretty=%B"
-            ])
+            message_result = await self._run_git_command(["log", "-1", "--pretty=%B"])
             return message_result.strip()
         except subprocess.CalledProcessError:
             # If no commits exist yet, return empty string
             return ""
@@ -353,182 +397,203 @@ Return ONLY a JSON object:
     async def _get_git_diff_for_commit(self, commit_hash: str) -> str:
         """
         Get git diff for a specific commit.
         Args:
             commit_hash: The commit hash to analyze
         Returns:
             Git diff content as string
         """
         try:
             # Get diff for the specific commit compared to its parent
-            diff_result = await self._run_git_command([
-                "diff", "--no-color", "--no-ext-diff", f"{commit_hash}~1..{commit_hash}"
-            ])
+            diff_result = await self._run_git_command(
+                [
+                    "diff",
+                    "--no-color",
+                    "--no-ext-diff",
+                    f"{commit_hash}~1..{commit_hash}",
+                ]
+            )
             return diff_result
         except subprocess.CalledProcessError:
             # If parent doesn't exist (first commit), diff against empty tree
             try:
-                diff_result = await self._run_git_command([
-                    "diff", "--no-color", "--no-ext-diff", "4b825dc642cb6eb9a060e54bf8d69288fbee4904", commit_hash
-                ])
+                diff_result = await self._run_git_command(
+                    [
+                        "diff",
+                        "--no-color",
+                        "--no-ext-diff",
+                        "4b825dc642cb6eb9a060e54bf8d69288fbee4904",
+                        commit_hash,
+                    ]
+                )
                 return diff_result
             except subprocess.CalledProcessError as e:
-                raise GitHookError(f"Failed to get git diff for commit {commit_hash}: {e}")
+                raise GitHookError(
+                    f"Failed to get git diff for commit {commit_hash}: {e}"
+                )
     async def _get_git_diff_for_range(self, start_hash: str, end_hash: str) -> str:
         """
         Get git diff for a range of commits.
         Args:
             start_hash: Starting commit hash (exclusive)
             end_hash: Ending commit hash (inclusive)
         Returns:
             Git diff content as string
         """
         try:
-            diff_result = await self._run_git_command([
-                "diff", "--no-color", "--no-ext-diff", f"{start_hash}..{end_hash}"
-            ])
+            diff_result = await self._run_git_command(
+                ["diff", "--no-color", "--no-ext-diff", f"{start_hash}..{end_hash}"]
+            )
             return diff_result
         except subprocess.CalledProcessError as e:
-            raise GitHookError(f"Failed to get git diff for range {start_hash}..{end_hash}: {e}")
+            raise GitHookError(
+                f"Failed to get git diff for range {start_hash}..{end_hash}: {e}"
+            )
     async def _get_commit_message_for_commit(self, commit_hash: str) -> str:
         """
         Get the commit message for a specific commit.
         Args:
             commit_hash: The commit hash
         Returns:
             Commit message as string
         """
         try:
-            message_result = await self._run_git_command([
-                "log", "-1", "--pretty=%B", commit_hash
-            ])
+            message_result = await self._run_git_command(
+                ["log", "-1", "--pretty=%B", commit_hash]
+            )
             return message_result.strip()
         except subprocess.CalledProcessError as e:
             raise GitHookError(f"Failed to get commit message for {commit_hash}: {e}")
-    async def _get_commit_messages_for_range(self, start_hash: str, end_hash: str) -> str:
+    async def _get_commit_messages_for_range(
+        self, start_hash: str, end_hash: str
+    ) -> str:
         """
         Get commit messages for a range of commits.
         Args:
             start_hash: Starting commit hash (exclusive)
             end_hash: Ending commit hash (inclusive)
         Returns:
             Combined commit messages as string
         """
         try:
             # Get all commit messages in the range
-            message_result = await self._run_git_command([
-                "log", "--pretty=%B", f"{start_hash}..{end_hash}"
-            ])
+            message_result = await self._run_git_command(
+                ["log", "--pretty=%B", f"{start_hash}..{end_hash}"]
+            )
             # Clean up and format the messages
             messages = message_result.strip()
             if messages:
-                return f"Combined commit messages for range {start_hash}..{end_hash}:\n\n{messages}"
+                return (
+                    f"Combined commit messages for range "
+                    f"{start_hash}..{end_hash}:\n\n{messages}"
+                )
             else:
                 return f"No commits found in range {start_hash}..{end_hash}"
         except subprocess.CalledProcessError as e:
-            raise GitHookError(f"Failed to get commit messages for range {start_hash}..{end_hash}: {e}")
+            raise GitHookError(
+                f"Failed to get commit messages for range {start_hash}..{end_hash}: {e}"
+            )
     def _extract_changed_files(self, git_diff: str) -> List[str]:
         """
         Extract list of changed files from git diff.
         Args:
             git_diff: Git diff content
         Returns:
             List of file paths that changed
         """
         changed_files = []
-        lines = git_diff.split('\n')
+        lines = git_diff.split("\n")
         for line in lines:
-            if line.startswith('diff --git a/'):
+            if line.startswith("diff --git a/"):
                 # Parse file path from diff header
                 # Format: diff --git a/path/to/file b/path/to/file
-                parts = line.split(' ')
+                parts = line.split(" ")
                 if len(parts) >= 4:
                     file_path = parts[2][2:]  # Remove 'a/' prefix
                     changed_files.append(file_path)
         return changed_files
     async def _get_project_overview(self, project_info: Dict[str, Any]) -> str:
         """Get current project overview from database."""
         try:
             # Try to find existing project
             project = await self.db_manager.find_matching_project(
-                project_info["projectName"],
-                project_info["folderPath"]
+                project_info["projectName"], project_info["folderPath"]
             )
             if project:
-                overview = await self.db_manager.get_project_overview(
-                    project.id
-                )
+                overview = await self.db_manager.get_project_overview(project.id)
                 return overview.overview if overview else ""
             return ""
         except Exception as e:
             self.logger.warning(f"Failed to get project overview: {e}")
             return ""
-    async def _get_all_descriptions(self, project_info: Dict[str, Any]) -> Dict[str, str]:
+    async def _get_all_descriptions(
+        self, project_info: Dict[str, Any]
+    ) -> Dict[str, str]:
         """Get all current file descriptions from database."""
         try:
             # Try to find existing project
             project = await self.db_manager.find_matching_project(
-                project_info["projectName"],
-                project_info["folderPath"]
+                project_info["projectName"], project_info["folderPath"]
             )
             if project:
                 descriptions = await self.db_manager.get_all_file_descriptions(
                     project.id
                 )
                 return {desc.file_path: desc.description for desc in descriptions}
             return {}
         except Exception as e:
             self.logger.warning(f"Failed to get file descriptions: {e}")
             return {}
     async def _analyze_overview_updates(
         self,
         git_diff: str,
-        commit_message: str,
+        commit_message: str,
         current_overview: str,
-        changed_files: List[str]
+        changed_files: List[str],
     ) -> Dict[str, Any]:
         """
         Stage 1: Analyze if project overview needs updating.
         Args:
             git_diff: Git diff content
             commit_message: Commit message explaining the changes
             current_overview: Current project overview
             changed_files: List of changed file paths
         Returns:
             Dict with overview_update key
         """
         self.logger.info("Stage 1: Analyzing overview updates...")
-        prompt = f"""Analyze this git commit to determine if the project overview needs updating.
+        prompt = f"""Analyze this git commit to determine if the project overview
+needs updating.
 COMMIT MESSAGE:
 {commit_message or "No commit message available"}
@@ -547,13 +612,15 @@ INSTRUCTIONS:
 Update project overview ONLY if there are major structural changes like:
 - New major features or components (indicated by commit message or new directories)
 - Architectural changes (new patterns, frameworks, or approaches)
-- Significant dependency additions (Cargo.toml, package.json, requirements.txt changes)
+- Significant dependency additions (Cargo.toml, package.json,
+  requirements.txt changes)
 - New API endpoints or workflows
 - Changes to build/deployment processes
 Do NOT update for: bug fixes, small refactors, documentation updates, version bumps.
-If updating, provide comprehensive narrative (10-20 pages of text) with directory structure, architecture, components, and workflows.
+If updating, provide comprehensive narrative (10-20 pages of text) with
+directory structure, architecture, components, and workflows.
 Return ONLY a JSON object:
 {{
@@ -563,15 +630,18 @@ Return ONLY a JSON object:
         # Log prompt details
         prompt_tokens = self.token_counter.count_tokens(prompt)
         self.logger.info(f"Stage 1 prompt: {prompt_tokens} tokens")
         if prompt_tokens > self.config["max_diff_tokens"]:
-            self.logger.warning(f"Stage 1 prompt too large ({prompt_tokens} tokens), skipping overview analysis")
+            self.logger.warning(
+                f"Stage 1 prompt too large ({prompt_tokens} tokens), "
+                f"skipping overview analysis"
+            )
             return {"overview_update": None}
         # Call OpenRouter API
         result = await self._call_openrouter(prompt)
         self.logger.info("Stage 1 completed: overview analysis")
         return result
     async def _analyze_file_updates(
@@ -579,29 +649,31 @@ Return ONLY a JSON object:
         git_diff: str,
         commit_message: str,
         current_descriptions: Dict[str, str],
-        changed_files: List[str]
+        changed_files: List[str],
     ) -> Dict[str, Any]:
         """
         Stage 2: Analyze file description updates.
         Args:
             git_diff: Git diff content
             commit_message: Commit message explaining the changes
             current_descriptions: Current file descriptions for changed files only
             changed_files: List of changed file paths
         Returns:
             Dict with file_updates key
         """
         self.logger.info("Stage 2: Analyzing file description updates...")
         # Only include descriptions for changed files to reduce token usage
         relevant_descriptions = {
-            path: desc for path, desc in current_descriptions.items()
+            path: desc
+            for path, desc in current_descriptions.items()
             if path in changed_files
         }
-        prompt = f"""Analyze this git commit and update file descriptions for changed files.
+        prompt = f"""Analyze this git commit and update file descriptions for
+changed files.
 COMMIT MESSAGE:
 {commit_message or "No commit message available"}
@@ -619,7 +691,9 @@ INSTRUCTIONS:
 Use the COMMIT MESSAGE to understand the intent and context of the changes.
-Update descriptions for files that have changed significantly. Consider both the diff content and commit message context. Only include files that need actual description updates.
+Update descriptions for files that have changed significantly. Consider both the
+diff content and commit message context. Only include files that need actual
+description updates.
 Return ONLY a JSON object:
 {{
@@ -629,32 +703,35 @@ Return ONLY a JSON object:
   }}
 }}"""
-        # Log prompt details
+        # Log prompt details
         prompt_tokens = self.token_counter.count_tokens(prompt)
         self.logger.info(f"Stage 2 prompt: {prompt_tokens} tokens")
         if prompt_tokens > self.config["max_diff_tokens"]:
-            self.logger.warning(f"Stage 2 prompt too large ({prompt_tokens} tokens), skipping file analysis")
+            self.logger.warning(
+                f"Stage 2 prompt too large ({prompt_tokens} tokens), "
+                f"skipping file analysis"
+            )
             return {"file_updates": {}}
         # Call OpenRouter API
         result = await self._call_openrouter(prompt)
         self.logger.info("Stage 2 completed: file description analysis")
         return result
     @retry(
         wait=wait_exponential(multiplier=1, min=4, max=60),
         stop=stop_after_attempt(5),
-        retry=retry_if_exception_type(ThrottlingError)
+        retry=retry_if_exception_type(ThrottlingError),
     )
     async def _call_openrouter(self, prompt: str) -> Dict[str, Any]:
         """
         Call OpenRouter API to analyze changes.
         Args:
             prompt: Analysis prompt
         Returns:
             Parsed response with file updates and overview update
         """
@@ -662,114 +739,126 @@ Return ONLY a JSON object:
             "Authorization": f"Bearer {self.api_key}",
             "HTTP-Referer": "https://github.com/fluffypony/mcp-code-indexer",
             "X-Title": "MCP Code Indexer Git Hook",
-            "Content-Type": "application/json"
+            "Content-Type": "application/json",
         }
         payload = {
             "model": self.config["model"],
             "messages": [
                 {
-                    "role": "system",
-                    "content": "You are a technical assistant that analyzes code changes and updates file descriptions accurately and concisely."
+                    "role": "system",
+                    "content": (
+                        "You are a technical assistant that analyzes code "
+                        "changes and updates file descriptions accurately "
+                        "and concisely."
+                    ),
                 },
-                {
-                    "role": "user",
-                    "content": prompt
-                }
+                {"role": "user", "content": prompt},
             ],
             "temperature": self.config["temperature"],
             "max_tokens": 24000,
         }
         timeout = aiohttp.ClientTimeout(total=self.config["timeout"])
-        self.logger.info(f"Sending request to OpenRouter API...")
+        self.logger.info("Sending request to OpenRouter API...")
         self.logger.info(f"  Model: {self.config['model']}")
         self.logger.info(f"  Temperature: {self.config['temperature']}")
-        self.logger.info(f"  Max tokens: 24000")
+        self.logger.info("  Max tokens: 24000")
         self.logger.info(f"  Timeout: {self.config['timeout']}s")
         try:
             async with aiohttp.ClientSession(timeout=timeout) as session:
                 async with session.post(
-                    self.OPENROUTER_API_URL,
-                    headers=headers,
-                    json=payload
+                    self.OPENROUTER_API_URL, headers=headers, json=payload
                 ) as response:
-                    self.logger.info(f"OpenRouter API response status: {response.status}")
+                    self.logger.info(
+                        f"OpenRouter API response status: {response.status}"
+                    )
                     if response.status == 429:
                         retry_after = int(response.headers.get("Retry-After", 60))
-                        self.logger.warning(f"Rate limited by OpenRouter, retry after {retry_after}s")
-                        raise ThrottlingError(f"Rate limited. Retry after {retry_after}s")
+                        self.logger.warning(
+                            f"Rate limited by OpenRouter, retry after {retry_after}s"
+                        )
+                        raise ThrottlingError(
+                            f"Rate limited. Retry after {retry_after}s"
+                        )
                     response.raise_for_status()
                     response_data = await response.json()
                     if "choices" not in response_data:
-                        self.logger.error(f"Invalid API response format: {response_data}")
-                        raise GitHookError(f"Invalid API response format: {response_data}")
+                        self.logger.error(
+                            f"Invalid API response format: {response_data}"
+                        )
+                        raise GitHookError(
+                            f"Invalid API response format: {response_data}"
+                        )
                     content = response_data["choices"][0]["message"]["content"]
-                    self.logger.info(f"OpenRouter response content length: {len(content)} characters")
+                    self.logger.info(
+                        f"OpenRouter response content length: {len(content)} characters"
+                    )
                     return self._validate_githook_response(content)
         except aiohttp.ClientError as e:
             self.logger.error(f"OpenRouter API request failed: {e}")
             self.logger.error(f"ClientError details: {type(e).__name__}: {str(e)}")
             raise GitHookError(f"OpenRouter API request failed: {e}")
-        except asyncio.TimeoutError as e:
-            self.logger.error(f"OpenRouter API request timed out after {self.config['timeout']}s")
+        except asyncio.TimeoutError:
+            self.logger.error(
+                f"OpenRouter API request timed out after {self.config['timeout']}s"
+            )
             raise GitHookError("OpenRouter API request timed out")
     def _validate_githook_response(self, response_text: str) -> Dict[str, Any]:
         """
         Validate and parse JSON response from OpenRouter.
         Args:
             response_text: Raw response content
         Returns:
             Validated response data
         """
         def extract_json_from_response(text: str) -> str:
             """Extract JSON from response that might have extra text before/after."""
             text = text.strip()
             # Try to find JSON in the response
             json_start = -1
             json_end = -1
             # Look for opening brace
             for i, char in enumerate(text):
-                if char == '{':
+                if char == "{":
                     json_start = i
                     break
             if json_start == -1:
                 return text  # No JSON found, return original
             # Find matching closing brace
             brace_count = 0
             for i in range(json_start, len(text)):
-                if text[i] == '{':
+                if text[i] == "{":
                     brace_count += 1
-                elif text[i] == '}':
+                elif text[i] == "}":
                     brace_count -= 1
                     if brace_count == 0:
                         json_end = i + 1
                         break
             if json_end == -1:
                 return text  # No matching brace found, return original
             return text[json_start:json_end]
         try:
             # First try parsing as-is
             try:
@@ -780,47 +869,51 @@ Return ONLY a JSON object:
                 if extracted_json != response_text.strip():
                     self.logger.debug(f"Extracted JSON from response: {extracted_json}")
                 data = json.loads(extracted_json)
             # Handle both single-stage and two-stage responses
             if "file_updates" in data and "overview_update" in data:
                 # Original single-stage format
                 if not isinstance(data["file_updates"], dict):
                     raise ValueError("'file_updates' must be a dictionary")
                 # Validate descriptions
                 for path, desc in data["file_updates"].items():
                     if not isinstance(desc, str) or not desc.strip():
                         raise ValueError(f"Invalid description for {path}")
             elif "file_updates" in data:
                 # Stage 2 format (file updates only)
                 if not isinstance(data["file_updates"], dict):
                     raise ValueError("'file_updates' must be a dictionary")
                 # Validate descriptions
                 for path, desc in data["file_updates"].items():
                     if not isinstance(desc, str) or not desc.strip():
                         raise ValueError(f"Invalid description for {path}")
             elif "overview_update" in data:
                 # Stage 1 format (overview only) - overview_update can be null
                 pass
             else:
-                raise ValueError("Response must contain 'file_updates' and/or 'overview_update'")
+                raise ValueError(
+                    "Response must contain 'file_updates' and/or 'overview_update'"
+                )
             return data
         except json.JSONDecodeError as e:
             self.logger.error(f"Raw response content: {repr(response_text)}")
             raise GitHookError(f"Invalid JSON response from API: {e}")
         except ValueError as e:
             self.logger.error(f"Raw response content: {repr(response_text)}")
             raise GitHookError(f"Invalid response structure: {e}")
-    async def _apply_updates(self, project_info: Dict[str, Any], updates: Dict[str, Any]) -> None:
+    async def _apply_updates(
+        self, project_info: Dict[str, Any], updates: Dict[str, Any]
+    ) -> None:
         """
         Apply updates to database.
         Args:
             project_info: Project identification info
             updates: Updates from OpenRouter API
@@ -828,77 +921,75 @@ Return ONLY a JSON object:
         try:
             # Get or create project
             project = await self.db_manager.get_or_create_project(
-                project_info["projectName"],
-                project_info["folderPath"]
+                project_info["projectName"], project_info["folderPath"]
             )
             # Update file descriptions
             file_updates = updates.get("file_updates", {})
             for file_path, description in file_updates.items():
                 from mcp_code_indexer.database.models import FileDescription
                 from datetime import datetime
                 file_desc = FileDescription(
                     project_id=project.id,
                     file_path=file_path,
                     description=description,
                     file_hash=None,
                     last_modified=datetime.utcnow(),
-                    version=1
+                    version=1,
                 )
                 await self.db_manager.create_file_description(file_desc)
                 self.logger.info(f"Updated description for {file_path}")
             # Update project overview if provided
             overview_update = updates.get("overview_update")
             if overview_update and overview_update.strip():
                 from mcp_code_indexer.database.models import ProjectOverview
                 from datetime import datetime
                 overview = ProjectOverview(
                     project_id=project.id,
                     overview=overview_update,
                     last_modified=datetime.utcnow(),
                     total_files=len(file_updates),
-                    total_tokens=len(overview_update.split())
+                    total_tokens=len(overview_update.split()),
                 )
                 await self.db_manager.create_project_overview(overview)
                 self.logger.info("Updated project overview")
         except Exception as e:
             raise GitHookError(f"Failed to apply updates to database: {e}")
     async def _run_git_command(self, cmd: List[str]) -> str:
         """
         Run a git command and return output.
         Args:
             cmd: Git command arguments
         Returns:
             Command output as string
         """
         full_cmd = ["git"] + cmd
         try:
             process = await asyncio.create_subprocess_exec(
                 *full_cmd,
                 stdout=asyncio.subprocess.PIPE,
                 stderr=asyncio.subprocess.PIPE,
-                cwd=Path.cwd()
+                cwd=Path.cwd(),
             )
             stdout, stderr = await process.communicate()
             if process.returncode != 0:
                 raise subprocess.CalledProcessError(
-                    process.returncode,
-                    full_cmd,
-                    stdout,
-                    stderr
+                    process.returncode, full_cmd, stdout, stderr
                 )
-            return stdout.decode('utf-8')
+            return stdout.decode("utf-8")
         except FileNotFoundError:
-            raise GitHookError("Git command not found - ensure git is installed and in PATH")
+            raise GitHookError(
+                "Git command not found - ensure git is installed and in PATH"
+            )

mcp-code-indexer 3.1.4__py3-none-any.whl → 3.1.5__py3-none-any.whl

mcp-code-indexer 3.1.4py3-none-any.whl → 3.1.5py3-none-any.whl