mcp-vector-search 1.0.3__py3-none-any.whl → 1.1.22__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63)
  1. mcp_vector_search/__init__.py +3 -3
  2. mcp_vector_search/analysis/__init__.py +48 -1
  3. mcp_vector_search/analysis/baseline/__init__.py +68 -0
  4. mcp_vector_search/analysis/baseline/comparator.py +462 -0
  5. mcp_vector_search/analysis/baseline/manager.py +621 -0
  6. mcp_vector_search/analysis/collectors/__init__.py +35 -0
  7. mcp_vector_search/analysis/collectors/cohesion.py +463 -0
  8. mcp_vector_search/analysis/collectors/coupling.py +1162 -0
  9. mcp_vector_search/analysis/collectors/halstead.py +514 -0
  10. mcp_vector_search/analysis/collectors/smells.py +325 -0
  11. mcp_vector_search/analysis/debt.py +516 -0
  12. mcp_vector_search/analysis/interpretation.py +685 -0
  13. mcp_vector_search/analysis/metrics.py +74 -1
  14. mcp_vector_search/analysis/reporters/__init__.py +3 -1
  15. mcp_vector_search/analysis/reporters/console.py +424 -0
  16. mcp_vector_search/analysis/reporters/markdown.py +480 -0
  17. mcp_vector_search/analysis/reporters/sarif.py +377 -0
  18. mcp_vector_search/analysis/storage/__init__.py +93 -0
  19. mcp_vector_search/analysis/storage/metrics_store.py +762 -0
  20. mcp_vector_search/analysis/storage/schema.py +245 -0
  21. mcp_vector_search/analysis/storage/trend_tracker.py +560 -0
  22. mcp_vector_search/analysis/trends.py +308 -0
  23. mcp_vector_search/analysis/visualizer/__init__.py +90 -0
  24. mcp_vector_search/analysis/visualizer/d3_data.py +534 -0
  25. mcp_vector_search/analysis/visualizer/exporter.py +484 -0
  26. mcp_vector_search/analysis/visualizer/html_report.py +2895 -0
  27. mcp_vector_search/analysis/visualizer/schemas.py +525 -0
  28. mcp_vector_search/cli/commands/analyze.py +665 -11
  29. mcp_vector_search/cli/commands/chat.py +193 -0
  30. mcp_vector_search/cli/commands/index.py +600 -2
  31. mcp_vector_search/cli/commands/index_background.py +467 -0
  32. mcp_vector_search/cli/commands/search.py +194 -1
  33. mcp_vector_search/cli/commands/setup.py +64 -13
  34. mcp_vector_search/cli/commands/status.py +302 -3
  35. mcp_vector_search/cli/commands/visualize/cli.py +26 -10
  36. mcp_vector_search/cli/commands/visualize/exporters/json_exporter.py +8 -4
  37. mcp_vector_search/cli/commands/visualize/graph_builder.py +167 -234
  38. mcp_vector_search/cli/commands/visualize/server.py +304 -15
  39. mcp_vector_search/cli/commands/visualize/templates/base.py +60 -6
  40. mcp_vector_search/cli/commands/visualize/templates/scripts.py +2100 -65
  41. mcp_vector_search/cli/commands/visualize/templates/styles.py +1297 -88
  42. mcp_vector_search/cli/didyoumean.py +5 -0
  43. mcp_vector_search/cli/main.py +16 -5
  44. mcp_vector_search/cli/output.py +134 -5
  45. mcp_vector_search/config/thresholds.py +89 -1
  46. mcp_vector_search/core/__init__.py +16 -0
  47. mcp_vector_search/core/database.py +39 -2
  48. mcp_vector_search/core/embeddings.py +24 -0
  49. mcp_vector_search/core/git.py +380 -0
  50. mcp_vector_search/core/indexer.py +445 -84
  51. mcp_vector_search/core/llm_client.py +9 -4
  52. mcp_vector_search/core/models.py +88 -1
  53. mcp_vector_search/core/relationships.py +473 -0
  54. mcp_vector_search/core/search.py +1 -1
  55. mcp_vector_search/mcp/server.py +795 -4
  56. mcp_vector_search/parsers/python.py +285 -5
  57. mcp_vector_search/utils/gitignore.py +0 -3
  58. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/METADATA +3 -2
  59. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/RECORD +62 -39
  60. mcp_vector_search/cli/commands/visualize.py.original +0 -2536
  61. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/WHEEL +0 -0
  62. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/entry_points.txt +0 -0
  63. {mcp_vector_search-1.0.3.dist-info → mcp_vector_search-1.1.22.dist-info}/licenses/LICENSE +0 -0
@@ -8,8 +8,11 @@ from typing import Any
8
8
 
9
9
  import typer
10
10
  from loguru import logger
11
+ from rich.panel import Panel
12
+ from rich.table import Table
11
13
 
12
14
  from ... import __version__
15
+ from ...analysis.storage.metrics_store import MetricsStore, MetricsStoreError
13
16
  from ...core.database import ChromaVectorDatabase
14
17
  from ...core.embeddings import create_embedding_function
15
18
  from ...core.exceptions import ProjectNotFoundError
@@ -60,6 +63,13 @@ def main(
60
63
  help="Check Claude Code MCP integration status",
61
64
  rich_help_panel="🔍 Diagnostics",
62
65
  ),
66
+ metrics: bool = typer.Option(
67
+ False,
68
+ "--metrics",
69
+ "-m",
70
+ help="Show project metrics summary from latest analysis",
71
+ rich_help_panel="📊 Display Options",
72
+ ),
63
73
  json_output: bool = typer.Option(
64
74
  False,
65
75
  "--json",
@@ -78,6 +88,9 @@ def main(
78
88
  [green]Quick status check:[/green]
79
89
  $ mcp-vector-search status
80
90
 
91
+ [green]Show code metrics summary:[/green]
92
+ $ mcp-vector-search status --metrics
93
+
81
94
  [green]Detailed status with all information:[/green]
82
95
  $ mcp-vector-search status --verbose
83
96
 
@@ -89,13 +102,13 @@ def main(
89
102
  [green]Full health check:[/green]
90
103
  $ mcp-vector-search status --health-check
91
104
 
92
- [green]Export status to JSON:[/green]
93
- $ mcp-vector-search status --json > status.json
105
+ [green]Export metrics to JSON:[/green]
106
+ $ mcp-vector-search status --metrics --json > metrics.json
94
107
 
95
108
  [green]Combined diagnostics:[/green]
96
109
  $ mcp-vector-search status --verbose --health-check --mcp
97
110
 
98
- [dim]💡 Tip: Use --health-check to diagnose issues with dependencies or database.[/dim]
111
+ [dim]💡 Tip: Use --metrics to see code quality analysis from 'mcp-vector-search analyze'[/dim]
99
112
  """
100
113
  try:
101
114
  # Use provided project_root or current working directory
@@ -111,6 +124,7 @@ def main(
111
124
  verbose=verbose,
112
125
  health_check=health_check,
113
126
  mcp=mcp,
127
+ metrics=metrics,
114
128
  json_output=json_output,
115
129
  ),
116
130
  timeout=30.0, # 30 second timeout
@@ -136,12 +150,20 @@ async def show_status(
136
150
  verbose: bool = False,
137
151
  health_check: bool = False,
138
152
  mcp: bool = False,
153
+ metrics: bool = False,
139
154
  json_output: bool = False,
140
155
  ) -> None:
141
156
  """Show comprehensive project status."""
142
157
  status_data = {}
143
158
 
144
159
  try:
160
+ # If metrics flag is set, show metrics summary and return
161
+ if metrics:
162
+ await show_metrics_summary(
163
+ project_root=project_root,
164
+ json_output=json_output,
165
+ )
166
+ return
145
167
  # Check if project is initialized - use the specified project root
146
168
  project_manager = ProjectManager(project_root)
147
169
 
@@ -518,6 +540,283 @@ async def check_mcp_integration(
518
540
  return mcp_status
519
541
 
520
542
 
543
+ async def show_metrics_summary(
544
+ project_root: Path,
545
+ json_output: bool = False,
546
+ ) -> None:
547
+ """Show code metrics summary from latest analysis.
548
+
549
+ Args:
550
+ project_root: Project root directory
551
+ json_output: Output as JSON instead of formatted console
552
+
553
+ Raises:
554
+ typer.Exit: If no metrics found or error occurs
555
+ """
556
+ try:
557
+ # Get metrics storage location
558
+ storage_dir = project_root / ".mcp-vector-search"
559
+ db_path = storage_dir / "metrics.db"
560
+
561
+ # Check if metrics database exists
562
+ if not db_path.exists():
563
+ if json_output:
564
+ print_json(
565
+ {
566
+ "status": "error",
567
+ "error": "No metrics found",
568
+ "message": "Run 'mcp-vector-search analyze' first",
569
+ }
570
+ )
571
+ else:
572
+ console.print(
573
+ "[yellow]No metrics found. Run 'mcp-vector-search analyze' first.[/yellow]"
574
+ )
575
+ raise typer.Exit(1)
576
+
577
+ # Load metrics store
578
+ store = MetricsStore(db_path)
579
+
580
+ # Get latest snapshot for this project
581
+ snapshots = store.get_project_history(str(project_root), limit=1)
582
+
583
+ if not snapshots:
584
+ if json_output:
585
+ print_json(
586
+ {
587
+ "status": "error",
588
+ "error": "No metrics found for this project",
589
+ "message": "Run 'mcp-vector-search analyze' first",
590
+ }
591
+ )
592
+ else:
593
+ console.print(
594
+ "[yellow]No metrics found for this project. "
595
+ "Run 'mcp-vector-search analyze' first.[/yellow]"
596
+ )
597
+ raise typer.Exit(1)
598
+
599
+ latest = snapshots[0]
600
+
601
+ # Output JSON or formatted
602
+ if json_output:
603
+ _output_metrics_json(latest)
604
+ else:
605
+ _print_metrics_summary(latest)
606
+
607
+ except MetricsStoreError as e:
608
+ logger.error(f"Failed to load metrics: {e}")
609
+ if json_output:
610
+ print_json({"status": "error", "error": str(e)})
611
+ else:
612
+ print_error(f"Failed to load metrics: {e}")
613
+ raise typer.Exit(1)
614
+ except Exception as e:
615
+ logger.error(f"Unexpected error loading metrics: {e}")
616
+ if json_output:
617
+ print_json({"status": "error", "error": str(e)})
618
+ else:
619
+ print_error(f"Unexpected error: {e}")
620
+ raise typer.Exit(1)
621
+
622
+
623
+ def _output_metrics_json(snapshot) -> None:
624
+ """Output metrics snapshot as JSON.
625
+
626
+ Args:
627
+ snapshot: ProjectSnapshot from metrics store
628
+ """
629
+ output = {
630
+ "status": "success",
631
+ "snapshot_id": snapshot.snapshot_id,
632
+ "project_path": snapshot.project_path,
633
+ "timestamp": snapshot.timestamp.isoformat(),
634
+ "metrics": {
635
+ "files": {
636
+ "total": snapshot.total_files,
637
+ "needing_attention": sum(
638
+ 1
639
+ for grade, count in snapshot.grade_distribution.items()
640
+ if grade in ["D", "F"]
641
+ for _ in range(count)
642
+ ),
643
+ },
644
+ "lines": {
645
+ "total": snapshot.total_lines,
646
+ },
647
+ "functions": {
648
+ "total": snapshot.total_functions,
649
+ },
650
+ "classes": {
651
+ "total": snapshot.total_classes,
652
+ },
653
+ "complexity": {
654
+ "average": round(snapshot.avg_complexity, 2),
655
+ "maximum": snapshot.max_complexity,
656
+ "total": snapshot.total_complexity,
657
+ "grade_distribution": snapshot.grade_distribution,
658
+ },
659
+ "code_smells": {
660
+ "total": snapshot.total_smells,
661
+ },
662
+ "health": {
663
+ "average_score": round(snapshot.avg_health_score, 2),
664
+ },
665
+ },
666
+ "metadata": {
667
+ "git_commit": snapshot.git_commit,
668
+ "git_branch": snapshot.git_branch,
669
+ "tool_version": snapshot.tool_version,
670
+ },
671
+ }
672
+
673
+ print_json(output)
674
+
675
+
676
+ def _print_metrics_summary(snapshot) -> None:
677
+ """Print formatted metrics summary using Rich.
678
+
679
+ Args:
680
+ snapshot: ProjectSnapshot from metrics store
681
+ """
682
+ # Header panel with overall stats
683
+ console.print(
684
+ Panel.fit(
685
+ f"[bold]Project Metrics Summary[/bold]\n"
686
+ f"Files: {snapshot.total_files} | "
687
+ f"Functions: {snapshot.total_functions} | "
688
+ f"Classes: {snapshot.total_classes} | "
689
+ f"Lines: {snapshot.total_lines:,}\n"
690
+ f"Analyzed: {snapshot.timestamp.strftime('%Y-%m-%d %H:%M:%S')}",
691
+ title="📊 mcp-vector-search",
692
+ border_style="blue",
693
+ )
694
+ )
695
+ console.print()
696
+
697
+ # Complexity metrics table
698
+ complexity_table = Table(title="Complexity Metrics", show_header=True)
699
+ complexity_table.add_column("Metric", style="cyan", no_wrap=True)
700
+ complexity_table.add_column("Average", justify="right")
701
+ complexity_table.add_column("Maximum", justify="right")
702
+ complexity_table.add_column("Total", justify="right")
703
+ complexity_table.add_column("Status", justify="center")
704
+
705
+ complexity_table.add_row(
706
+ "Cognitive Complexity",
707
+ f"{snapshot.avg_complexity:.1f}",
708
+ f"{snapshot.max_complexity}",
709
+ f"{snapshot.total_complexity}",
710
+ _status_indicator(snapshot.avg_complexity, 10, 20),
711
+ )
712
+
713
+ console.print(complexity_table)
714
+ console.print()
715
+
716
+ # Grade distribution table
717
+ grade_table = Table(title="Complexity Grade Distribution", show_header=True)
718
+ grade_table.add_column("Grade", style="cyan", no_wrap=True)
719
+ grade_table.add_column("Count", justify="right")
720
+ grade_table.add_column("Percentage", justify="right")
721
+ grade_table.add_column("Description")
722
+
723
+ total_chunks = sum(snapshot.grade_distribution.values())
724
+ grade_descriptions = {
725
+ "A": "Excellent (0-5)",
726
+ "B": "Good (6-10)",
727
+ "C": "Acceptable (11-20)",
728
+ "D": "Needs Improvement (21-30)",
729
+ "F": "Refactor Recommended (31+)",
730
+ }
731
+
732
+ for grade in ["A", "B", "C", "D", "F"]:
733
+ count = snapshot.grade_distribution.get(grade, 0)
734
+ percentage = (count / total_chunks * 100) if total_chunks > 0 else 0
735
+
736
+ # Color code the grade
737
+ grade_color = {
738
+ "A": "green",
739
+ "B": "blue",
740
+ "C": "yellow",
741
+ "D": "orange1",
742
+ "F": "red",
743
+ }.get(grade, "white")
744
+
745
+ grade_table.add_row(
746
+ f"[{grade_color}]{grade}[/{grade_color}]",
747
+ str(count),
748
+ f"{percentage:.1f}%",
749
+ grade_descriptions[grade],
750
+ )
751
+
752
+ console.print(grade_table)
753
+ console.print()
754
+
755
+ # Code smells summary
756
+ if snapshot.total_smells > 0:
757
+ console.print(
758
+ f"[yellow]Code Smells:[/yellow] {snapshot.total_smells} issues detected"
759
+ )
760
+ console.print()
761
+
762
+ # Health score
763
+ health_color = (
764
+ "green"
765
+ if snapshot.avg_health_score >= 0.8
766
+ else "yellow"
767
+ if snapshot.avg_health_score >= 0.6
768
+ else "red"
769
+ )
770
+ console.print(
771
+ f"[bold]Health Score:[/bold] [{health_color}]{snapshot.avg_health_score:.2f}[/{health_color}] / 1.00"
772
+ )
773
+ console.print()
774
+
775
+ # Git metadata (if available)
776
+ if snapshot.git_commit or snapshot.git_branch:
777
+ metadata_parts = []
778
+ if snapshot.git_branch:
779
+ metadata_parts.append(f"Branch: {snapshot.git_branch}")
780
+ if snapshot.git_commit:
781
+ metadata_parts.append(f"Commit: {snapshot.git_commit[:8]}")
782
+ if snapshot.tool_version:
783
+ metadata_parts.append(f"Version: {snapshot.tool_version}")
784
+
785
+ console.print(f"[dim]{' | '.join(metadata_parts)}[/dim]")
786
+ console.print()
787
+
788
+ # Files needing attention
789
+ files_needing_attention = snapshot.grade_distribution.get(
790
+ "D", 0
791
+ ) + snapshot.grade_distribution.get("F", 0)
792
+ if files_needing_attention > 0:
793
+ console.print(
794
+ f"[yellow]⚠️ {files_needing_attention} code chunks need attention (grades D or F)[/yellow]"
795
+ )
796
+ console.print()
797
+
798
+
799
+ def _status_indicator(
800
+ value: float, warning_threshold: float, error_threshold: float
801
+ ) -> str:
802
+ """Return colored status indicator based on thresholds.
803
+
804
+ Args:
805
+ value: Value to check
806
+ warning_threshold: Warning threshold (yellow)
807
+ error_threshold: Error threshold (red)
808
+
809
+ Returns:
810
+ Colored status indicator (green, yellow, or red dot)
811
+ """
812
+ if value < warning_threshold:
813
+ return "[green]●[/green]"
814
+ elif value < error_threshold:
815
+ return "[yellow]●[/yellow]"
816
+ else:
817
+ return "[red]●[/red]"
818
+
819
+
521
820
  def check_dependencies() -> bool:
522
821
  """Check if all required dependencies are available.
523
822
 
@@ -24,21 +24,22 @@ from .graph_builder import build_graph_data
24
24
  from .server import find_free_port, start_visualization_server
25
25
 
26
26
  app = typer.Typer(
27
- help="Visualize code chunk relationships",
27
+ help="📊 Visualize code chunk relationships",
28
+ invoke_without_command=True,
28
29
  )
29
30
  console = Console()
30
31
 
31
32
 
32
- @app.callback(invoke_without_command=True)
33
+ @app.callback()
33
34
  def visualize_callback(ctx: typer.Context) -> None:
34
35
  """Visualize code chunk relationships.
35
36
 
36
- When called without a subcommand, automatically starts the visualization server.
37
+ If no subcommand is provided, defaults to starting the visualization server.
37
38
  """
38
- # If no subcommand was invoked, run serve with defaults
39
39
  if ctx.invoked_subcommand is None:
40
- # Call serve directly with default parameters
41
- serve(port=8080, graph_file=Path("chunk-graph.json"), code_only=False)
40
+ # Default to serve when no subcommand given
41
+ # Must pass explicit defaults since typer.Option doesn't work when called directly
42
+ serve(port=8501, graph_file=Path("chunk-graph.json"), code_only=False)
42
43
 
43
44
 
44
45
  @app.command()
@@ -185,7 +186,7 @@ async def _export_chunks(
185
186
  @app.command()
186
187
  def serve(
187
188
  port: int = typer.Option(
188
- 8080, "--port", "-p", help="Port for visualization server"
189
+ 8501, "--port", "-p", help="Port for visualization server"
189
190
  ),
190
191
  graph_file: Path = typer.Option(
191
192
  Path("chunk-graph.json"),
@@ -202,7 +203,7 @@ def serve(
202
203
  """Start local HTTP server for D3.js visualization.
203
204
 
204
205
  Examples:
205
- # Start server on default port 8080
206
+ # Start server on default port 8501
206
207
  mcp-vector-search visualize serve
207
208
 
208
209
  # Custom port
@@ -215,9 +216,9 @@ def serve(
215
216
  mcp-vector-search visualize serve --code-only
216
217
  """
217
218
  # Use specified port or find free one
218
- if port == 8080: # Default port, try to find free one
219
+ if port == 8501: # Default port, try to find free one
219
220
  try:
220
- port = find_free_port(8080, 8099)
221
+ port = find_free_port(8501, 8599)
221
222
  except OSError as e:
222
223
  console.print(f"[red]✗ {e}[/red]")
223
224
  raise typer.Exit(1)
@@ -245,8 +246,23 @@ def serve(
245
246
  export_to_html(html_file)
246
247
 
247
248
  # Check if we need to regenerate the graph file
249
+ # Regenerate if: graph doesn't exist, code_only filter, or index is newer than graph
248
250
  needs_regeneration = not graph_file.exists() or code_only
249
251
 
252
+ # Check if index database is newer than graph (stale graph detection)
253
+ if graph_file.exists() and not needs_regeneration:
254
+ index_db = (
255
+ project_manager.project_root / ".mcp-vector-search" / "chroma.sqlite3"
256
+ )
257
+ if index_db.exists():
258
+ graph_mtime = graph_file.stat().st_mtime
259
+ index_mtime = index_db.stat().st_mtime
260
+ if index_mtime > graph_mtime:
261
+ console.print(
262
+ "[yellow]Index has changed since graph was generated. Regenerating...[/yellow]"
263
+ )
264
+ needs_regeneration = True
265
+
250
266
  if graph_file.exists() and not needs_regeneration:
251
267
  # Use existing unfiltered file
252
268
  dest = viz_dir / "chunk-graph.json"
@@ -1,12 +1,13 @@
1
1
  """JSON export functionality for graph data.
2
2
 
3
3
  This module handles exporting graph data to JSON format.
4
+ Uses orjson for 5-10x faster serialization performance.
4
5
  """
5
6
 
6
- import json
7
7
  from pathlib import Path
8
8
  from typing import Any
9
9
 
10
+ import orjson
10
11
  from rich.console import Console
11
12
 
12
13
  console = Console()
@@ -15,6 +16,8 @@ console = Console()
15
16
  def export_to_json(graph_data: dict[str, Any], output_path: Path) -> None:
16
17
  """Export graph data to JSON file.
17
18
 
19
+ Uses orjson for fast serialization (5-10x faster than stdlib json).
20
+
18
21
  Args:
19
22
  graph_data: Graph data dictionary containing nodes, links, and metadata
20
23
  output_path: Path to output JSON file
@@ -22,8 +25,9 @@ def export_to_json(graph_data: dict[str, Any], output_path: Path) -> None:
22
25
  # Ensure output directory exists
23
26
  output_path.parent.mkdir(parents=True, exist_ok=True)
24
27
 
25
- # Write to file
26
- with open(output_path, "w") as f:
27
- json.dump(graph_data, f, indent=2)
28
+ # Write to file using orjson for fast serialization
29
+ # OPT_INDENT_2 gives readable output, OPT_SORT_KEYS for consistency
30
+ with open(output_path, "wb") as f:
31
+ f.write(orjson.dumps(graph_data, option=orjson.OPT_INDENT_2))
28
32
 
29
33
  console.print(f"[green]✓[/green] Exported graph data to [cyan]{output_path}[/cyan]")