mcp-vector-search 0.12.6__py3-none-any.whl → 1.1.22__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package as they appear in their respective public registries. It is provided for informational purposes only.
Files changed (92)
  1. mcp_vector_search/__init__.py +3 -3
  2. mcp_vector_search/analysis/__init__.py +111 -0
  3. mcp_vector_search/analysis/baseline/__init__.py +68 -0
  4. mcp_vector_search/analysis/baseline/comparator.py +462 -0
  5. mcp_vector_search/analysis/baseline/manager.py +621 -0
  6. mcp_vector_search/analysis/collectors/__init__.py +74 -0
  7. mcp_vector_search/analysis/collectors/base.py +164 -0
  8. mcp_vector_search/analysis/collectors/cohesion.py +463 -0
  9. mcp_vector_search/analysis/collectors/complexity.py +743 -0
  10. mcp_vector_search/analysis/collectors/coupling.py +1162 -0
  11. mcp_vector_search/analysis/collectors/halstead.py +514 -0
  12. mcp_vector_search/analysis/collectors/smells.py +325 -0
  13. mcp_vector_search/analysis/debt.py +516 -0
  14. mcp_vector_search/analysis/interpretation.py +685 -0
  15. mcp_vector_search/analysis/metrics.py +414 -0
  16. mcp_vector_search/analysis/reporters/__init__.py +7 -0
  17. mcp_vector_search/analysis/reporters/console.py +646 -0
  18. mcp_vector_search/analysis/reporters/markdown.py +480 -0
  19. mcp_vector_search/analysis/reporters/sarif.py +377 -0
  20. mcp_vector_search/analysis/storage/__init__.py +93 -0
  21. mcp_vector_search/analysis/storage/metrics_store.py +762 -0
  22. mcp_vector_search/analysis/storage/schema.py +245 -0
  23. mcp_vector_search/analysis/storage/trend_tracker.py +560 -0
  24. mcp_vector_search/analysis/trends.py +308 -0
  25. mcp_vector_search/analysis/visualizer/__init__.py +90 -0
  26. mcp_vector_search/analysis/visualizer/d3_data.py +534 -0
  27. mcp_vector_search/analysis/visualizer/exporter.py +484 -0
  28. mcp_vector_search/analysis/visualizer/html_report.py +2895 -0
  29. mcp_vector_search/analysis/visualizer/schemas.py +525 -0
  30. mcp_vector_search/cli/commands/analyze.py +1062 -0
  31. mcp_vector_search/cli/commands/chat.py +1455 -0
  32. mcp_vector_search/cli/commands/index.py +621 -5
  33. mcp_vector_search/cli/commands/index_background.py +467 -0
  34. mcp_vector_search/cli/commands/init.py +13 -0
  35. mcp_vector_search/cli/commands/install.py +597 -335
  36. mcp_vector_search/cli/commands/install_old.py +8 -4
  37. mcp_vector_search/cli/commands/mcp.py +78 -6
  38. mcp_vector_search/cli/commands/reset.py +68 -26
  39. mcp_vector_search/cli/commands/search.py +224 -8
  40. mcp_vector_search/cli/commands/setup.py +1184 -0
  41. mcp_vector_search/cli/commands/status.py +339 -5
  42. mcp_vector_search/cli/commands/uninstall.py +276 -357
  43. mcp_vector_search/cli/commands/visualize/__init__.py +39 -0
  44. mcp_vector_search/cli/commands/visualize/cli.py +292 -0
  45. mcp_vector_search/cli/commands/visualize/exporters/__init__.py +12 -0
  46. mcp_vector_search/cli/commands/visualize/exporters/html_exporter.py +33 -0
  47. mcp_vector_search/cli/commands/visualize/exporters/json_exporter.py +33 -0
  48. mcp_vector_search/cli/commands/visualize/graph_builder.py +647 -0
  49. mcp_vector_search/cli/commands/visualize/layout_engine.py +469 -0
  50. mcp_vector_search/cli/commands/visualize/server.py +600 -0
  51. mcp_vector_search/cli/commands/visualize/state_manager.py +428 -0
  52. mcp_vector_search/cli/commands/visualize/templates/__init__.py +16 -0
  53. mcp_vector_search/cli/commands/visualize/templates/base.py +234 -0
  54. mcp_vector_search/cli/commands/visualize/templates/scripts.py +4542 -0
  55. mcp_vector_search/cli/commands/visualize/templates/styles.py +2522 -0
  56. mcp_vector_search/cli/didyoumean.py +27 -2
  57. mcp_vector_search/cli/main.py +127 -160
  58. mcp_vector_search/cli/output.py +158 -13
  59. mcp_vector_search/config/__init__.py +4 -0
  60. mcp_vector_search/config/default_thresholds.yaml +52 -0
  61. mcp_vector_search/config/settings.py +12 -0
  62. mcp_vector_search/config/thresholds.py +273 -0
  63. mcp_vector_search/core/__init__.py +16 -0
  64. mcp_vector_search/core/auto_indexer.py +3 -3
  65. mcp_vector_search/core/boilerplate.py +186 -0
  66. mcp_vector_search/core/config_utils.py +394 -0
  67. mcp_vector_search/core/database.py +406 -94
  68. mcp_vector_search/core/embeddings.py +24 -0
  69. mcp_vector_search/core/exceptions.py +11 -0
  70. mcp_vector_search/core/git.py +380 -0
  71. mcp_vector_search/core/git_hooks.py +4 -4
  72. mcp_vector_search/core/indexer.py +632 -54
  73. mcp_vector_search/core/llm_client.py +756 -0
  74. mcp_vector_search/core/models.py +91 -1
  75. mcp_vector_search/core/project.py +17 -0
  76. mcp_vector_search/core/relationships.py +473 -0
  77. mcp_vector_search/core/scheduler.py +11 -11
  78. mcp_vector_search/core/search.py +179 -29
  79. mcp_vector_search/mcp/server.py +819 -9
  80. mcp_vector_search/parsers/python.py +285 -5
  81. mcp_vector_search/utils/__init__.py +2 -0
  82. mcp_vector_search/utils/gitignore.py +0 -3
  83. mcp_vector_search/utils/gitignore_updater.py +212 -0
  84. mcp_vector_search/utils/monorepo.py +66 -4
  85. mcp_vector_search/utils/timing.py +10 -6
  86. {mcp_vector_search-0.12.6.dist-info → mcp_vector_search-1.1.22.dist-info}/METADATA +184 -53
  87. mcp_vector_search-1.1.22.dist-info/RECORD +120 -0
  88. {mcp_vector_search-0.12.6.dist-info → mcp_vector_search-1.1.22.dist-info}/WHEEL +1 -1
  89. {mcp_vector_search-0.12.6.dist-info → mcp_vector_search-1.1.22.dist-info}/entry_points.txt +1 -0
  90. mcp_vector_search/cli/commands/visualize.py +0 -1467
  91. mcp_vector_search-0.12.6.dist-info/RECORD +0 -68
  92. {mcp_vector_search-0.12.6.dist-info → mcp_vector_search-1.1.22.dist-info}/licenses/LICENSE +0 -0
mcp_vector_search/analysis/metrics.py
@@ -0,0 +1,414 @@
+"""Metric dataclasses for structural code analysis."""
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+from datetime import datetime
+from typing import TYPE_CHECKING, Any
+
+if TYPE_CHECKING:
+    from ..config.thresholds import ThresholdConfig
+
+
+@dataclass
+class ChunkMetrics:
+    """Metrics for a single code chunk (function/class/method).
+
+    Tracks complexity metrics, code smells, and computes quality grades
+    for individual code chunks.
+
+    Attributes:
+        cognitive_complexity: Cognitive complexity score (how hard to understand)
+        cyclomatic_complexity: Cyclomatic complexity (number of decision paths)
+        max_nesting_depth: Maximum nesting level (if/for/while/try depth)
+        parameter_count: Number of function parameters
+        lines_of_code: Total lines in the chunk
+        smells: List of detected code smells (e.g., "too_many_parameters")
+        complexity_grade: Computed A-F grade based on cognitive complexity
+    """
+
+    cognitive_complexity: int = 0
+    cyclomatic_complexity: int = 0
+    max_nesting_depth: int = 0
+    parameter_count: int = 0
+    lines_of_code: int = 0
+
+    # Halstead metrics (Phase 4)
+    halstead_volume: float | None = None
+    halstead_difficulty: float | None = None
+    halstead_effort: float | None = None
+    halstead_bugs: float | None = None
+
+    # Code smells detected
+    smells: list[str] = field(default_factory=list)
+
+    # Computed grades (A-F scale)
+    complexity_grade: str = field(init=False, default="A")
+
+    def __post_init__(self) -> None:
+        """Initialize computed fields after dataclass initialization."""
+        self.complexity_grade = self._compute_grade()
+
+    def _compute_grade(self, thresholds: ThresholdConfig | None = None) -> str:
+        """Compute A-F grade based on cognitive complexity.
+
+        Args:
+            thresholds: Optional custom threshold configuration.
+                If None, uses default thresholds.
+
+        Grade thresholds (defaults):
+        - A: 0-5 (excellent)
+        - B: 6-10 (good)
+        - C: 11-20 (acceptable)
+        - D: 21-30 (needs improvement)
+        - F: 31+ (refactor recommended)
+
+        Returns:
+            Letter grade from A to F
+        """
+        if thresholds is None:
+            # Use default thresholds
+            if self.cognitive_complexity <= 5:
+                return "A"
+            elif self.cognitive_complexity <= 10:
+                return "B"
+            elif self.cognitive_complexity <= 20:
+                return "C"
+            elif self.cognitive_complexity <= 30:
+                return "D"
+            else:
+                return "F"
+        else:
+            # Use custom thresholds
+            return thresholds.get_grade(self.cognitive_complexity)
+
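
The default grade bands are easy to sanity-check in isolation. A minimal sketch, assuming mcp-vector-search 1.1.22 is installed and the module is importable under the path shown in the file list:

```python
from mcp_vector_search.analysis.metrics import ChunkMetrics

# __post_init__ grades against the default bands, so no ThresholdConfig
# is needed for the common case; these pairs exercise each boundary.
for cc, expected in [(0, "A"), (5, "A"), (6, "B"), (20, "C"), (30, "D"), (31, "F")]:
    chunk = ChunkMetrics(cognitive_complexity=cc)
    assert chunk.complexity_grade == expected, (cc, chunk.complexity_grade)
print("boundary values grade as documented")
```

Note that `_compute_grade` accepts a `ThresholdConfig`, but `__post_init__` calls it with no argument, so custom thresholds from `config/thresholds.py` only take effect when the grade is recomputed explicitly.
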
+    def to_metadata(self) -> dict[str, Any]:
+        """Flatten metrics for ChromaDB metadata storage.
+
+        ChromaDB supports: str, int, float, bool.
+        Lists are converted to JSON strings for compatibility.
+
+        Returns:
+            Dictionary of flattened metrics compatible with ChromaDB
+        """
+        import json
+
+        metadata = {
+            "cognitive_complexity": self.cognitive_complexity,
+            "cyclomatic_complexity": self.cyclomatic_complexity,
+            "max_nesting_depth": self.max_nesting_depth,
+            "parameter_count": self.parameter_count,
+            "lines_of_code": self.lines_of_code,
+            "complexity_grade": self.complexity_grade,
+            "code_smells": json.dumps(self.smells),  # Convert list to JSON string
+            "smell_count": len(self.smells),
+        }
+
+        # Add Halstead metrics if available
+        if self.halstead_volume is not None:
+            metadata["halstead_volume"] = self.halstead_volume
+        if self.halstead_difficulty is not None:
+            metadata["halstead_difficulty"] = self.halstead_difficulty
+        if self.halstead_effort is not None:
+            metadata["halstead_effort"] = self.halstead_effort
+        if self.halstead_bugs is not None:
+            metadata["halstead_bugs"] = self.halstead_bugs
+
+        return metadata
+
+
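
Since ChromaDB metadata values must be scalars, the list-to-JSON round trip above is the detail worth seeing in action. A short sketch with made-up metric values:

```python
import json

from mcp_vector_search.analysis.metrics import ChunkMetrics

chunk = ChunkMetrics(
    cognitive_complexity=12,
    parameter_count=6,
    lines_of_code=45,
    smells=["too_many_parameters"],
)
meta = chunk.to_metadata()

print(meta["complexity_grade"])         # "C": 12 falls in the 11-20 band
print(meta["code_smells"])              # '["too_many_parameters"]', a JSON string
print(json.loads(meta["code_smells"]))  # ['too_many_parameters'] round-trips back
print("halstead_volume" in meta)        # False: unset Halstead metrics are omitted
```
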
+@dataclass
+class CouplingMetrics:
+    """Coupling metrics for a file.
+
+    Tracks dependencies between files to measure coupling.
+
+    Attributes:
+        efferent_coupling: Number of files this file depends on (outgoing dependencies)
+        afferent_coupling: Number of files that depend on this file (incoming dependencies)
+        imports: List of all imported modules
+        internal_imports: Imports from same project
+        external_imports: Third-party and standard library imports
+        dependents: List of files that import this file
+        instability: Ratio Ce / (Ce + Ca), measures resistance to change (0-1)
+    """
+
+    efferent_coupling: int = 0  # Ce - outgoing dependencies
+    afferent_coupling: int = 0  # Ca - incoming dependencies
+    imports: list[str] = field(default_factory=list)
+    internal_imports: list[str] = field(default_factory=list)
+    external_imports: list[str] = field(default_factory=list)
+    dependents: list[str] = field(default_factory=list)
+
+    @property
+    def instability(self) -> float:
+        """Calculate instability metric (0-1).
+
+        Instability = Ce / (Ce + Ca)
+
+        Interpretation:
+        - 0.0: Maximally stable (many incoming, few outgoing)
+        - 0.5: Balanced (equal incoming and outgoing)
+        - 1.0: Maximally unstable (many outgoing, few incoming)
+
+        Returns:
+            Instability ratio from 0.0 to 1.0
+        """
+        total = self.efferent_coupling + self.afferent_coupling
+        if total == 0:
+            return 0.0
+        return self.efferent_coupling / total
+
+
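
The property implements the classic instability ratio I = Ce / (Ce + Ca). A worked example, including the zero-dependency guard:

```python
from mcp_vector_search.analysis.metrics import CouplingMetrics

# Three outgoing dependencies (Ce) against one incoming (Ca):
coupling = CouplingMetrics(efferent_coupling=3, afferent_coupling=1)
print(coupling.instability)  # 3 / (3 + 1) = 0.75, leaning unstable

# No recorded dependencies short-circuits to 0.0 instead of dividing by zero:
print(CouplingMetrics().instability)  # 0.0
```
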
+@dataclass
+class FileMetrics:
+    """Aggregated metrics for an entire file.
+
+    Tracks file-level statistics and aggregates chunk metrics for all
+    functions/classes within the file.
+
+    Attributes:
+        file_path: Relative or absolute path to the file
+        total_lines: Total lines in file (including blank/comments)
+        code_lines: Lines containing code
+        comment_lines: Lines containing comments
+        blank_lines: Blank lines
+        function_count: Number of top-level functions
+        class_count: Number of classes
+        method_count: Number of methods (functions inside classes)
+        total_complexity: Sum of cognitive complexity across all chunks
+        avg_complexity: Average cognitive complexity per chunk
+        max_complexity: Maximum cognitive complexity in any chunk
+        chunks: List of chunk metrics for each function/class
+        coupling: Coupling metrics for this file
+    """
+
+    file_path: str
+    total_lines: int = 0
+    code_lines: int = 0
+    comment_lines: int = 0
+    blank_lines: int = 0
+
+    function_count: int = 0
+    class_count: int = 0
+    method_count: int = 0
+
+    # Aggregated complexity
+    total_complexity: int = 0
+    avg_complexity: float = 0.0
+    max_complexity: int = 0
+
+    # Coupling metrics (Phase 3)
+    efferent_coupling: int = 0  # Outgoing dependencies
+    imports: list[str] = field(default_factory=list)  # All imported modules
+    internal_imports: list[str] = field(default_factory=list)  # Same-project imports
+    external_imports: list[str] = field(
+        default_factory=list
+    )  # Third-party/stdlib imports
+
+    # Chunk metrics for each function/class
+    chunks: list[ChunkMetrics] = field(default_factory=list)
+
+    # Coupling metrics
+    coupling: CouplingMetrics = field(default_factory=CouplingMetrics)
+
+    def compute_aggregates(self) -> None:
+        """Compute aggregate metrics from chunk metrics.
+
+        Calculates total_complexity, avg_complexity, and max_complexity
+        by aggregating values from all chunks.
+        """
+        if not self.chunks:
+            self.total_complexity = 0
+            self.avg_complexity = 0.0
+            self.max_complexity = 0
+            return
+
+        # Compute complexity aggregates
+        complexities = [chunk.cognitive_complexity for chunk in self.chunks]
+        self.total_complexity = sum(complexities)
+        self.avg_complexity = self.total_complexity / len(self.chunks)
+        self.max_complexity = max(complexities)
+
+    @property
+    def health_score(self) -> float:
+        """Calculate 0.0-1.0 health score based on metrics.
+
+        Health score considers:
+        - Average complexity (lower is better)
+        - Code smells count (fewer is better)
+        - Comment ratio (balanced is better)
+
+        Returns:
+            Health score from 0.0 (poor) to 1.0 (excellent)
+        """
+        score = 1.0
+
+        # Penalty for high average complexity (A=0%, B=-10%, C=-20%, D=-30%, F=-50%)
+        if self.avg_complexity > 30:
+            score -= 0.5
+        elif self.avg_complexity > 20:
+            score -= 0.3
+        elif self.avg_complexity > 10:
+            score -= 0.2
+        elif self.avg_complexity > 5:
+            score -= 0.1
+
+        # Penalty for code smells (up to -30%)
+        total_smells = sum(len(chunk.smells) for chunk in self.chunks)
+        smell_penalty = min(0.3, total_smells * 0.05)  # 5% per smell, max 30%
+        score -= smell_penalty
+
+        # Penalty for poor comment ratio (ideal: 10-30%)
+        if self.total_lines > 0:
+            comment_ratio = self.comment_lines / self.total_lines
+            if comment_ratio < 0.1:  # Too few comments
+                score -= 0.1
+            elif comment_ratio > 0.5:  # Too many comments (suspicious)
+                score -= 0.1
+
+        return max(0.0, score)  # Clamp to 0.0 minimum
+
+
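
`compute_aggregates()` and `health_score` are meant to be used together, since the score reads `avg_complexity`. A worked sketch; the file path and smell labels are illustrative placeholders:

```python
from mcp_vector_search.analysis.metrics import ChunkMetrics, FileMetrics

fm = FileMetrics(
    file_path="src/example.py",  # placeholder path
    total_lines=100,
    comment_lines=20,  # 20% comment ratio sits inside the ideal 10-30% band
    chunks=[
        ChunkMetrics(cognitive_complexity=8),
        ChunkMetrics(
            cognitive_complexity=16,
            smells=["too_many_parameters", "deep_nesting"],  # illustrative labels
        ),
    ],
)
fm.compute_aggregates()
print(fm.total_complexity, fm.avg_complexity, fm.max_complexity)  # 24 12.0 16

# Penalties: avg_complexity 12 lands in the >10 band (-0.2), two smells
# cost 2 * 0.05 (-0.1), and the comment ratio costs nothing, so:
# 1.0 - 0.2 - 0.1 = 0.7 (up to float rounding).
print(round(fm.health_score, 2))  # 0.7
```
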
+@dataclass
+class ProjectMetrics:
+    """Project-wide metric aggregates.
+
+    Tracks project-level statistics and identifies complexity hotspots
+    across the entire codebase.
+
+    Attributes:
+        project_root: Root directory of the project
+        analyzed_at: Timestamp when analysis was performed
+        total_files: Total number of analyzed files
+        total_lines: Total lines across all files
+        total_functions: Total number of functions
+        total_classes: Total number of classes
+        files: Dictionary mapping file paths to FileMetrics
+        avg_file_complexity: Average complexity across all files
+        hotspots: List of file paths with highest complexity (top 10)
+    """
+
+    project_root: str
+    analyzed_at: datetime = field(default_factory=datetime.now)
+
+    total_files: int = 0
+    total_lines: int = 0
+    total_functions: int = 0
+    total_classes: int = 0
+
+    # File metrics indexed by path
+    files: dict[str, FileMetrics] = field(default_factory=dict)
+
+    # Project-wide aggregates
+    avg_file_complexity: float = 0.0
+    hotspots: list[str] = field(default_factory=list)  # Top 10 complex files
+
+    def compute_aggregates(self) -> None:
+        """Compute project-wide aggregates from file metrics.
+
+        Calculates:
+        - Total files, lines, functions, classes
+        - Average file complexity
+        - Identifies complexity hotspots
+        """
+        if not self.files:
+            self.total_files = 0
+            self.total_lines = 0
+            self.total_functions = 0
+            self.total_classes = 0
+            self.avg_file_complexity = 0.0
+            self.hotspots = []
+            return
+
+        # Compute totals
+        self.total_files = len(self.files)
+        self.total_lines = sum(f.total_lines for f in self.files.values())
+        self.total_functions = sum(f.function_count for f in self.files.values())
+        self.total_classes = sum(f.class_count for f in self.files.values())
+
+        # Compute average file complexity
+        file_complexities = [f.avg_complexity for f in self.files.values() if f.chunks]
+        if file_complexities:
+            self.avg_file_complexity = sum(file_complexities) / len(file_complexities)
+        else:
+            self.avg_file_complexity = 0.0
+
+        # Identify hotspots (top 10 most complex files)
+        hotspot_files = self.get_hotspots(limit=10)
+        self.hotspots = [f.file_path for f in hotspot_files]
+
+    def get_hotspots(self, limit: int = 10) -> list[FileMetrics]:
+        """Return top N most complex files.
+
+        Complexity is determined by average cognitive complexity per chunk.
+        Files with no chunks are excluded.
+
+        Args:
+            limit: Maximum number of hotspots to return
+
+        Returns:
+            List of FileMetrics sorted by complexity (highest first)
+        """
+        # Filter files with chunks and sort by avg complexity
+        files_with_complexity = [f for f in self.files.values() if f.chunks]
+        sorted_files = sorted(
+            files_with_complexity, key=lambda f: f.avg_complexity, reverse=True
+        )
+        return sorted_files[:limit]
+
+    def to_summary(self) -> dict[str, Any]:
+        """Generate summary dict for reporting.
+
+        Returns:
+            Dictionary containing project summary with key metrics
+        """
+        return {
+            "project_root": self.project_root,
+            "analyzed_at": self.analyzed_at.isoformat(),
+            "total_files": self.total_files,
+            "total_lines": self.total_lines,
+            "total_functions": self.total_functions,
+            "total_classes": self.total_classes,
+            "avg_file_complexity": round(self.avg_file_complexity, 2),
+            "hotspots": self.hotspots,
+            "complexity_distribution": self._compute_grade_distribution(),
+            "health_metrics": {
+                "avg_health_score": self._compute_avg_health_score(),
+                "files_needing_attention": self._count_files_needing_attention(),
+            },
+        }
+
+    def _compute_grade_distribution(self) -> dict[str, int]:
+        """Compute distribution of complexity grades across all chunks.
+
+        Returns:
+            Dictionary mapping grade (A-F) to count of chunks
+        """
+        distribution: dict[str, int] = {"A": 0, "B": 0, "C": 0, "D": 0, "F": 0}
+
+        for file_metrics in self.files.values():
+            for chunk in file_metrics.chunks:
+                distribution[chunk.complexity_grade] += 1
+
+        return distribution
+
+    def _compute_avg_health_score(self) -> float:
+        """Compute average health score across all files.
+
+        Returns:
+            Average health score from 0.0 to 1.0
+        """
+        if not self.files:
+            return 1.0
+
+        health_scores = [f.health_score for f in self.files.values()]
+        return sum(health_scores) / len(health_scores)
+
+    def _count_files_needing_attention(self) -> int:
+        """Count files with health score below 0.7.
+
+        Returns:
+            Number of files that need attention
+        """
+        return sum(1 for f in self.files.values() if f.health_score < 0.7)
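
At the project level the same pattern repeats one layer up: populate `files`, call `compute_aggregates()`, then read `hotspots` and `to_summary()`. A sketch with three synthetic files (paths and complexities invented for illustration):

```python
from mcp_vector_search.analysis.metrics import (
    ChunkMetrics,
    FileMetrics,
    ProjectMetrics,
)


def make_file(path: str, complexity: int) -> FileMetrics:
    """Build a one-chunk FileMetrics with its aggregates precomputed."""
    fm = FileMetrics(
        file_path=path,
        total_lines=50,
        comment_lines=10,
        chunks=[ChunkMetrics(cognitive_complexity=complexity)],
    )
    fm.compute_aggregates()
    return fm


project = ProjectMetrics(project_root="/tmp/demo")
for path, cc in [("a.py", 4), ("b.py", 25), ("c.py", 9)]:
    project.files[path] = make_file(path, cc)
project.compute_aggregates()

print(project.hotspots[0])  # b.py (highest average complexity)
summary = project.to_summary()
print(summary["avg_file_complexity"])      # 12.67
print(summary["complexity_distribution"])  # {'A': 1, 'B': 1, 'C': 0, 'D': 1, 'F': 0}
```
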
mcp_vector_search/analysis/reporters/__init__.py
@@ -0,0 +1,7 @@
+"""Analysis reporters for outputting metrics in various formats."""
+
+from .console import ConsoleReporter
+from .markdown import MarkdownReporter
+from .sarif import SARIFReporter
+
+__all__ = ["ConsoleReporter", "MarkdownReporter", "SARIFReporter"]
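
Only the public names are visible in this hunk; the reporter implementations live in console.py, markdown.py, and sarif.py, all new in this release per the file list. SARIF is the Static Analysis Results Interchange Format, so the third reporter suggests the analysis output can feed standard static-analysis tooling. The safe takeaway is just the import surface; no constructor or method signature is assumed here:

```python
# Public surface confirmed by __all__ above. How each class consumes a
# ProjectMetrics is defined in modules not shown in this diff, so nothing
# beyond the imports is assumed.
from mcp_vector_search.analysis.reporters import (
    ConsoleReporter,
    MarkdownReporter,
    SARIFReporter,
)

print([cls.__name__ for cls in (ConsoleReporter, MarkdownReporter, SARIFReporter)])
```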