mcp-vector-search 1.0.3__py3-none-any.whl → 1.1.22__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63)
  1. mcp_vector_search/__init__.py +3 -3
  2. mcp_vector_search/analysis/__init__.py +48 -1
  3. mcp_vector_search/analysis/baseline/__init__.py +68 -0
  4. mcp_vector_search/analysis/baseline/comparator.py +462 -0
  5. mcp_vector_search/analysis/baseline/manager.py +621 -0
  6. mcp_vector_search/analysis/collectors/__init__.py +35 -0
  7. mcp_vector_search/analysis/collectors/cohesion.py +463 -0
  8. mcp_vector_search/analysis/collectors/coupling.py +1162 -0
  9. mcp_vector_search/analysis/collectors/halstead.py +514 -0
  10. mcp_vector_search/analysis/collectors/smells.py +325 -0
  11. mcp_vector_search/analysis/debt.py +516 -0
  12. mcp_vector_search/analysis/interpretation.py +685 -0
  13. mcp_vector_search/analysis/metrics.py +74 -1
  14. mcp_vector_search/analysis/reporters/__init__.py +3 -1
  15. mcp_vector_search/analysis/reporters/console.py +424 -0
  16. mcp_vector_search/analysis/reporters/markdown.py +480 -0
  17. mcp_vector_search/analysis/reporters/sarif.py +377 -0
  18. mcp_vector_search/analysis/storage/__init__.py +93 -0
  19. mcp_vector_search/analysis/storage/metrics_store.py +762 -0
  20. mcp_vector_search/analysis/storage/schema.py +245 -0
  21. mcp_vector_search/analysis/storage/trend_tracker.py +560 -0
  22. mcp_vector_search/analysis/trends.py +308 -0
  23. mcp_vector_search/analysis/visualizer/__init__.py +90 -0
  24. mcp_vector_search/analysis/visualizer/d3_data.py +534 -0
  25. mcp_vector_search/analysis/visualizer/exporter.py +484 -0
  26. mcp_vector_search/analysis/visualizer/html_report.py +2895 -0
  27. mcp_vector_search/analysis/visualizer/schemas.py +525 -0
  28. mcp_vector_search/cli/commands/analyze.py +665 -11
  29. mcp_vector_search/cli/commands/chat.py +193 -0
  30. mcp_vector_search/cli/commands/index.py +600 -2
  31. mcp_vector_search/cli/commands/index_background.py +467 -0
  32. mcp_vector_search/cli/commands/search.py +194 -1
  33. mcp_vector_search/cli/commands/setup.py +64 -13
  34. mcp_vector_search/cli/commands/status.py +302 -3
  35. mcp_vector_search/cli/commands/visualize/cli.py +26 -10
  36. mcp_vector_search/cli/commands/visualize/exporters/json_exporter.py +8 -4
  37. mcp_vector_search/cli/commands/visualize/graph_builder.py +167 -234
  38. mcp_vector_search/cli/commands/visualize/server.py +304 -15
  39. mcp_vector_search/cli/commands/visualize/templates/base.py +60 -6
  40. mcp_vector_search/cli/commands/visualize/templates/scripts.py +2100 -65
  41. mcp_vector_search/cli/commands/visualize/templates/styles.py +1297 -88
  42. mcp_vector_search/cli/didyoumean.py +5 -0
  43. mcp_vector_search/cli/main.py +16 -5
  44. mcp_vector_search/cli/output.py +134 -5
  45. mcp_vector_search/config/thresholds.py +89 -1
  46. mcp_vector_search/core/__init__.py +16 -0
  47. mcp_vector_search/core/database.py +39 -2
  48. mcp_vector_search/core/embeddings.py +24 -0
  49. mcp_vector_search/core/git.py +380 -0
  50. mcp_vector_search/core/indexer.py +445 -84
  51. mcp_vector_search/core/llm_client.py +9 -4
  52. mcp_vector_search/core/models.py +88 -1
  53. mcp_vector_search/core/relationships.py +473 -0
  54. mcp_vector_search/core/search.py +1 -1
  55. mcp_vector_search/mcp/server.py +795 -4
  56. mcp_vector_search/parsers/python.py +285 -5
  57. mcp_vector_search/utils/gitignore.py +0 -3
  58. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/METADATA +3 -2
  59. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/RECORD +62 -39
  60. mcp_vector_search/cli/commands/visualize.py.original +0 -2536
  61. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/WHEEL +0 -0
  62. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/entry_points.txt +0 -0
  63. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/licenses/LICENSE +0 -0
mcp_vector_search/analysis/reporters/sarif.py (new file)
@@ -0,0 +1,377 @@
+ """SARIF 2.1.0 output format for code analysis results.
+
+ This module provides SARIF (Static Analysis Results Interchange Format) 2.1.0
+ compliant output for code smells and structural analysis results. SARIF is an
+ OASIS standard format for sharing static analysis results between tools.
+
+ SARIF Specification: https://docs.oasis-open.org/sarif/sarif/v2.1.0/sarif-v2.1.0.html
+
+ Example:
+     >>> from pathlib import Path
+     >>> from ..collectors.smells import CodeSmell, SmellSeverity
+     >>> reporter = SARIFReporter()
+     >>> smells = [CodeSmell(...)]
+     >>> reporter.write_sarif(smells, Path("report.sarif"))
+ """
+
+ from __future__ import annotations
+
+ import hashlib
+ import json
+ from dataclasses import dataclass
+ from datetime import UTC, datetime
+ from pathlib import Path
+ from typing import TYPE_CHECKING, Any
+
+ if TYPE_CHECKING:
+     from ..collectors.smells import CodeSmell, SmellSeverity
+
+
+ @dataclass
+ class SARIFReporter:
+     """Generate SARIF 2.1.0 formatted reports for code analysis.
+
+     SARIF (Static Analysis Results Interchange Format) is an industry-standard
+     JSON-based format for static analysis tool output, enabling integration with
+     IDEs, CI/CD systems, and security tools.
+
+     Attributes:
+         tool_name: Name of the analysis tool (default: "MCP Vector Search")
+         tool_version: Version of the tool (default: from package)
+         tool_uri: URI to tool documentation/homepage
+         include_help_text: Include help text for each rule (default: True)
+         include_fingerprints: Include result fingerprints for deduplication (default: True)
+
+     Example:
+         >>> reporter = SARIFReporter()
+         >>> sarif_doc = reporter.generate_sarif(code_smells, base_path=Path("/project"))
+         >>> reporter.write_sarif(code_smells, Path("report.sarif"))
+     """
+
+     tool_name: str = "MCP Vector Search"
+     tool_version: str = "1.0.3"
+     tool_uri: str = "https://github.com/bobmatnyc/mcp-vector-search"
+     include_help_text: bool = True
+     include_fingerprints: bool = True
+
+     def generate_sarif(
+         self, smells: list[CodeSmell], base_path: Path | None = None
+     ) -> dict[str, Any]:
+         """Generate SARIF 2.1.0 document from code smells.
+
+         Creates a complete SARIF document with tool metadata, rules, and results.
+         All file paths are made relative to base_path if provided.
+
+         Args:
+             smells: List of detected code smells to report
+             base_path: Base directory for making paths relative (optional).
+                 If None, uses absolute paths.
+
+         Returns:
+             Dictionary containing SARIF 2.1.0 compliant document structure
+
+         Example:
+             >>> smells = [CodeSmell(name="Long Method", ...)]
+             >>> sarif = reporter.generate_sarif(smells, Path.cwd())
+             >>> print(json.dumps(sarif, indent=2))
+         """
+         # Build unique rules from all smells
+         rules = self._build_rules(smells)
+
+         # Convert smells to SARIF results
+         results = [self._smell_to_result(smell, base_path) for smell in smells]
+
+         # Build complete SARIF document
+         sarif_doc = {
+             "$schema": "https://json.schemastore.org/sarif-2.1.0.json",
+             "version": "2.1.0",
+             "runs": [
+                 {
+                     "tool": {
+                         "driver": {
+                             "name": self.tool_name,
+                             "version": self.tool_version,
+                             "informationUri": self.tool_uri,
+                             "rules": rules,
+                         }
+                     },
+                     "results": results,
+                     "invocations": [
+                         {
+                             "executionSuccessful": True,
+                             "endTimeUtc": datetime.now(UTC).isoformat(),
+                         }
+                     ],
+                 }
+             ],
+         }
+
+         return sarif_doc
+
+     def write_sarif(
+         self,
+         smells: list[CodeSmell],
+         output_path: Path,
+         base_path: Path | None = None,
+         indent: int = 2,
+     ) -> None:
+         """Write SARIF report to file.
+
+         Generates the SARIF document and writes it to the specified path with
+         pretty-printing for readability.
+
+         Args:
+             smells: List of code smells to report
+             output_path: Path where the SARIF file should be written
+             base_path: Base directory for relative paths (optional)
+             indent: JSON indentation level (default: 2, 0 for compact)
+
+         Raises:
+             IOError: If the file cannot be written
+             OSError: If the directory cannot be created
+
+         Example:
+             >>> reporter.write_sarif(smells, Path("report.sarif"), indent=2)
+         """
+         sarif_doc = self.generate_sarif(smells, base_path)
+
+         # Ensure parent directory exists
+         output_path.parent.mkdir(parents=True, exist_ok=True)
+
+         # Write with pretty-printing
+         with open(output_path, "w", encoding="utf-8") as f:
+             if indent > 0:
+                 json.dump(sarif_doc, f, indent=indent, ensure_ascii=False)
+             else:
+                 json.dump(sarif_doc, f, ensure_ascii=False)
+
+     def _severity_to_level(self, severity: SmellSeverity) -> str:
+         """Map SmellSeverity to SARIF level.
+
+         SARIF defines three result levels: error, warning, note.
+         We map our SmellSeverity enum to these levels.
+
+         Args:
+             severity: SmellSeverity enum value
+
+         Returns:
+             SARIF level string ("error", "warning", or "note")
+
+         Mapping:
+             ERROR -> "error" (requires immediate attention)
+             WARNING -> "warning" (should be addressed)
+             INFO -> "note" (informational)
+         """
+         from ..collectors.smells import SmellSeverity
+
+         mapping = {
+             SmellSeverity.ERROR: "error",
+             SmellSeverity.WARNING: "warning",
+             SmellSeverity.INFO: "note",
+         }
+         return mapping.get(severity, "warning")
+
+     def _smell_to_rule_id(self, smell_name: str) -> str:
+         """Convert smell name to SARIF rule ID (kebab-case).
+
+         Transforms human-readable smell names to kebab-case IDs suitable
+         for use as SARIF rule identifiers.
+
+         Args:
+             smell_name: Human-readable smell name (e.g., "Long Method")
+
+         Returns:
+             Kebab-case rule ID (e.g., "long-method")
+
+         Examples:
+             >>> reporter._smell_to_rule_id("Long Method")
+             'long-method'
+             >>> reporter._smell_to_rule_id("God Class")
+             'god-class'
+             >>> reporter._smell_to_rule_id("Deep_Nesting")
+             'deep-nesting'
+         """
+         return smell_name.lower().replace(" ", "-").replace("_", "-")
+
+     def _build_rules(self, smells: list[CodeSmell]) -> list[dict[str, Any]]:
+         """Generate unique rules from code smells.
+
+         Creates SARIF rule definitions for all unique smell types found.
+         Each rule includes ID, description, and help text.
+
+         Args:
+             smells: List of code smells to extract rules from
+
+         Returns:
+             List of SARIF rule objects with metadata
+
+         SARIF Rule Structure:
+             - id: Unique rule identifier (kebab-case)
+             - shortDescription: Brief rule description
+             - help: Detailed help text with suggestions
+             - properties: Additional metadata (optional)
+         """
+         # Track unique smell types
+         unique_smells: dict[str, CodeSmell] = {}
+         for smell in smells:
+             rule_id = self._smell_to_rule_id(smell.name)
+             if rule_id not in unique_smells:
+                 unique_smells[rule_id] = smell
+
+         # Build rule definitions
+         rules = []
+         for rule_id, smell in unique_smells.items():
+             rule = {
+                 "id": rule_id,
+                 "shortDescription": {"text": smell.name},
+                 "fullDescription": {"text": self._get_smell_description(smell.name)},
+             }
+
+             # Add help text if enabled
+             if self.include_help_text and smell.suggestion:
+                 rule["help"] = {"text": smell.suggestion}
+
+             # Add default severity configuration
+             rule["defaultConfiguration"] = {
+                 "level": self._severity_to_level(smell.severity)
+             }
+
+             rules.append(rule)
+
+         return rules
+
+     def _get_smell_description(self, smell_name: str) -> str:
+         """Get detailed description for code smell type.
+
+         Provides comprehensive descriptions for each smell type to help
+         developers understand what the issue is and why it matters.
+
+         Args:
+             smell_name: Name of the code smell
+
+         Returns:
+             Detailed description explaining the smell and its impact
+         """
+         descriptions = {
+             "Long Method": "Method or function exceeds recommended length thresholds, making it harder to understand, test, and maintain. Long methods often indicate that the function is doing too much and violates the Single Responsibility Principle.",
+             "Deep Nesting": "Code has excessive nesting depth (nested if/for/while blocks), reducing readability and increasing cognitive complexity. Deep nesting makes it harder to understand control flow and increases the likelihood of bugs.",
+             "Long Parameter List": "Function or method has too many parameters, making the API difficult to use and understand. Consider using parameter objects, builder pattern, or decomposing the function into smaller pieces.",
+             "God Class": "Class has too many responsibilities, indicated by high method count and large size. This violates the Single Responsibility Principle and makes the class difficult to maintain, test, and reason about.",
+             "Complex Method": "Method has high cyclomatic complexity (many decision points), making it difficult to test and prone to bugs. High complexity indicates complex control flow that should be simplified or decomposed.",
+         }
+
+         return descriptions.get(
+             smell_name,
+             f"Code smell detected: {smell_name}. Consider refactoring to improve maintainability.",
+         )
+
+     def _smell_to_result(
+         self, smell: CodeSmell, base_path: Path | None = None
+     ) -> dict[str, Any]:
+         """Convert CodeSmell to SARIF result object.
+
+         Transforms a CodeSmell into SARIF result format with location,
+         message, and optional fingerprint for deduplication.
+
+         Args:
+             smell: Code smell to convert
+             base_path: Base path for making file paths relative (optional)
+
+         Returns:
+             SARIF result object with location and message
+
+         SARIF Result Structure:
+             - ruleId: Reference to rule definition
+             - level: Severity level (error/warning/note)
+             - message: Human-readable message
+             - locations: Where the issue was found
+             - partialFingerprints: For result deduplication (optional)
+         """
+         # Parse location string (format: "file:line" or "file")
+         location_parts = smell.location.rsplit(":", 1)
+         file_path = location_parts[0]
+         line_number = int(location_parts[1]) if len(location_parts) > 1 else None
+
+         # Make path relative if base_path provided
+         if base_path:
+             try:
+                 file_path_obj = Path(file_path)
+                 if file_path_obj.is_absolute():
+                     file_path = str(file_path_obj.relative_to(base_path))
+             except (ValueError, OSError):
+                 # Keep original path if relative_to fails
+                 pass
+
+         # Build SARIF result
+         result: dict[str, Any] = {
+             "ruleId": self._smell_to_rule_id(smell.name),
+             "level": self._severity_to_level(smell.severity),
+             "message": {
+                 "text": (
+                     f"{smell.name}: {smell.description}"
+                     if smell.description
+                     else smell.name
+                 )
+             },
+             "locations": [
+                 {
+                     "physicalLocation": {
+                         "artifactLocation": {
+                             "uri": file_path,
+                         }
+                     }
+                 }
+             ],
+         }
+
+         # Add region (line number) if available
+         if line_number is not None:
+             result["locations"][0]["physicalLocation"]["region"] = {
+                 "startLine": line_number
+             }
+
+         # Add fingerprint for deduplication if enabled
+         if self.include_fingerprints:
+             result["partialFingerprints"] = {
+                 "primaryLocationLineHash": self._compute_fingerprint(smell)
+             }
+
+         # Add additional properties
+         result["properties"] = {
+             "metricValue": smell.metric_value,
+             "threshold": smell.threshold,
+         }
+
+         return result
+
+     def _compute_fingerprint(self, smell: CodeSmell) -> str:
+         """Generate stable fingerprint for result deduplication.
+
+         Creates a SHA-256 hash of key smell attributes to enable
+         deduplication across runs and comparison of results over time.
+
+         Args:
+             smell: Code smell to fingerprint
+
+         Returns:
+             16-character hex string fingerprint
+
+         Fingerprint Includes:
+             - Smell name (type of issue)
+             - Location (file:line)
+             - Metric value (normalized to string)
+
+         Example:
+             >>> smell = CodeSmell(name="Long Method", location="file.py:10", ...)
+             >>> fingerprint = reporter._compute_fingerprint(smell)
+             >>> len(fingerprint)
+             16
+         """
+         # Normalize metric value to avoid floating point differences
+         normalized_metric = f"{smell.metric_value:.1f}"
+
+         # Build fingerprint content
+         content = f"{smell.name}:{smell.location}:{normalized_metric}"
+
+         # Compute SHA-256 and take first 16 characters
+         return hashlib.sha256(content.encode()).hexdigest()[:16]
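
For orientation, here is a minimal usage sketch of the new reporter. The reporter names and signatures come directly from the hunk above; the CodeSmell keyword arguments are an assumption based on the attributes the reporter reads (name, location, description, suggestion, severity, metric_value, threshold), since the actual constructor lives in collectors/smells.py and is not part of this diff.

    from pathlib import Path

    from mcp_vector_search.analysis.collectors.smells import CodeSmell, SmellSeverity
    from mcp_vector_search.analysis.reporters.sarif import SARIFReporter

    # Hypothetical smell instance: field names mirror what the reporter reads,
    # but CodeSmell's real constructor is defined outside this hunk.
    smell = CodeSmell(
        name="Long Method",
        location="src/app.py:42",  # "file:line" format parsed by _smell_to_result()
        description="Function spans 120 lines",
        suggestion="Extract helper functions",
        severity=SmellSeverity.WARNING,
        metric_value=120.0,
        threshold=50.0,
    )

    reporter = SARIFReporter()
    # base_path makes URIs in the report relative, keeping it portable across
    # checkouts and CI runners; rule IDs become kebab-case ("long-method").
    reporter.write_sarif([smell], Path("report.sarif"), base_path=Path.cwd())

The resulting report.sarif can be consumed by any SARIF 2.1.0 aware tool, and the partialFingerprints emitted by _compute_fingerprint let such tools deduplicate recurring findings across runs.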
mcp_vector_search/analysis/storage/__init__.py (new file)
@@ -0,0 +1,93 @@
+ """Storage module for metrics persistence and historical tracking.
+
+ This module provides SQLite-based storage for code metrics, enabling:
+ - Historical tracking of file and project metrics over time
+ - Trend analysis to identify improving/degrading code quality
+ - Snapshot comparison for release-to-release analysis
+ - Code smell tracking and remediation monitoring
+
+ Public API:
+     - MetricsStore: Main storage interface
+     - ProjectSnapshot: Project-wide metrics at a point in time
+     - TrendData: Trend analysis results
+     - GitInfo: Git metadata for traceability
+
+ Exceptions:
+     - MetricsStoreError: Base exception for storage errors
+     - DatabaseLockedError: Database locked by another process
+     - DuplicateEntryError: Attempted duplicate entry
+
+ Example Usage:
+     >>> from mcp_vector_search.analysis.storage import MetricsStore
+     >>> from mcp_vector_search.analysis.metrics import ProjectMetrics
+     >>>
+     >>> # Initialize store (uses default ~/.mcp-vector-search/metrics.db)
+     >>> store = MetricsStore()
+     >>>
+     >>> # Save complete snapshot
+     >>> metrics = ProjectMetrics(project_root="/path/to/project")
+     >>> # ... populate metrics ...
+     >>> snapshot_id = store.save_complete_snapshot(metrics)
+     >>>
+     >>> # Query history
+     >>> history = store.get_project_history("/path/to/project", limit=10)
+     >>> for snapshot in history:
+     ...     print(f"{snapshot.timestamp}: {snapshot.avg_complexity:.2f}")
+     >>>
+     >>> # Analyze trends
+     >>> trends = store.get_trends("/path/to/project", days=30)
+     >>> if trends.improving:
+     ...     print(f"Complexity improving at {abs(trends.change_rate):.4f}/day")
+     ... else:
+     ...     print(f"Complexity degrading at {trends.change_rate:.4f}/day")
+     >>>
+     >>> store.close()
+
+ Context Manager Usage:
+     >>> with MetricsStore() as store:
+     ...     snapshot_id = store.save_complete_snapshot(metrics)
+     ...     # Connection automatically closed
+
+ See Also:
+     - schema.py: Database schema definitions
+     - metrics_store.py: MetricsStore implementation
+ """
+
+ from .metrics_store import (
+     DatabaseLockedError,
+     DuplicateEntryError,
+     GitInfo,
+     MetricsStore,
+     MetricsStoreError,
+     ProjectSnapshot,
+     TrendData,
+ )
+ from .schema import SCHEMA_VERSION
+ from .trend_tracker import (
+     FileRegression,
+     TrendDirection,
+     TrendTracker,
+ )
+ from .trend_tracker import (
+     TrendData as EnhancedTrendData,
+ )
+
+ __all__ = [
+     # Main storage class
+     "MetricsStore",
+     # Trend tracking
+     "TrendTracker",
+     "TrendDirection",
+     "FileRegression",
+     # Data classes
+     "ProjectSnapshot",
+     "TrendData",
+     "EnhancedTrendData",
+     "GitInfo",
+     # Exceptions
+     "MetricsStoreError",
+     "DatabaseLockedError",
+     "DuplicateEntryError",
+     # Schema version
+     "SCHEMA_VERSION",
+ ]
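
A short sketch of how this re-exported API might be driven, based only on the names and docstring in the hunk above. Note that trend_tracker.TrendData is re-exported under the alias EnhancedTrendData so it does not shadow metrics_store.TrendData; the get_trends() call and the improving/change_rate attributes are taken from the module docstring and are not verified against metrics_store.py itself.

    from mcp_vector_search.analysis.storage import MetricsStore

    # Context-manager form from the docstring: the connection is closed on exit.
    with MetricsStore() as store:
        trends = store.get_trends("/path/to/project", days=30)
        direction = "improving" if trends.improving else "degrading"
        print(f"Complexity {direction} at {abs(trends.change_rate):.4f}/day")

Re-importing trend_tracker a second time under an alias is the conventional way to expose two same-named classes from one package; callers that need the richer trend object import EnhancedTrendData explicitly.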