PyPI - kg-mcp - Versions diffs - 0.1.8__py3-none-any.whl - Mend

kg-mcp 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

kg_mcp/__init__.py +5 -0
kg_mcp/__main__.py +8 -0
kg_mcp/cli/__init__.py +3 -0
kg_mcp/cli/setup.py +1100 -0
kg_mcp/cli/status.py +344 -0
kg_mcp/codegraph/__init__.py +3 -0
kg_mcp/codegraph/indexer.py +296 -0
kg_mcp/codegraph/model.py +170 -0
kg_mcp/config.py +83 -0
kg_mcp/kg/__init__.py +3 -0
kg_mcp/kg/apply_schema.py +93 -0
kg_mcp/kg/ingest.py +253 -0
kg_mcp/kg/neo4j.py +155 -0
kg_mcp/kg/repo.py +756 -0
kg_mcp/kg/retrieval.py +225 -0
kg_mcp/kg/schema.cypher +176 -0
kg_mcp/llm/__init__.py +4 -0
kg_mcp/llm/client.py +291 -0
kg_mcp/llm/prompts/__init__.py +8 -0
kg_mcp/llm/prompts/extractor.py +84 -0
kg_mcp/llm/prompts/linker.py +117 -0
kg_mcp/llm/schemas.py +248 -0
kg_mcp/main.py +195 -0
kg_mcp/mcp/__init__.py +3 -0
kg_mcp/mcp/change_schemas.py +140 -0
kg_mcp/mcp/prompts.py +223 -0
kg_mcp/mcp/resources.py +218 -0
kg_mcp/mcp/tools.py +537 -0
kg_mcp/security/__init__.py +3 -0
kg_mcp/security/auth.py +121 -0
kg_mcp/security/origin.py +112 -0
kg_mcp/utils.py +100 -0
kg_mcp-0.1.8.dist-info/METADATA +86 -0
kg_mcp-0.1.8.dist-info/RECORD +36 -0
kg_mcp-0.1.8.dist-info/WHEEL +4 -0
kg_mcp-0.1.8.dist-info/entry_points.txt +4 -0

kg_mcp/mcp/tools.py ADDED Viewed

@@ -0,0 +1,537 @@
+"""
+MCP Tool definitions for the Knowledge Graph Memory Server.
+This module exposes ONLY 2 tools to AI agents:
+- kg_autopilot: Call at the START of every task
+- kg_track_changes: Call AFTER every file modification
+All other functionality is internal and not exposed via MCP.
+"""
+import logging
+from typing import Any, Dict, List, Optional
+from mcp.server.fastmcp import FastMCP
+from kg_mcp.kg.ingest import get_ingest_pipeline
+from kg_mcp.kg.retrieval import get_context_builder
+from kg_mcp.kg.repo import get_repository
+from kg_mcp.utils import serialize_response
+logger = logging.getLogger(__name__)
+# =============================================================================
+# INTERNAL HELPER FUNCTIONS (Not exposed via MCP)
+# =============================================================================
+async def _ingest_message(
+    project_id: str,
+    user_text: str,
+    files: Optional[List[str]] = None,
+    diff: Optional[str] = None,
+    symbols: Optional[List[str]] = None,
+    tags: Optional[List[str]] = None,
+) -> Dict[str, Any]:
+    """
+    Internal: Analyze and save a user request to the knowledge graph.
+    Called by kg_autopilot.
+    """
+    logger.info(f"_ingest_message called for project {project_id}")
+    try:
+        pipeline = get_ingest_pipeline()
+        result = await pipeline.process_message(
+            project_id=project_id,
+            user_text=user_text,
+            files=files,
+            diff=diff,
+            symbols=symbols,
+            tags=tags,
+        )
+        return serialize_response(result)
+    except Exception as e:
+        logger.error(f"_ingest_message failed: {e}")
+        return {
+            "error": str(e),
+            "interaction_id": None,
+            "extracted": {},
+            "created_entities": {},
+        }
+async def _context_pack(
+    project_id: str,
+    focus_goal_id: Optional[str] = None,
+    query: Optional[str] = None,
+    k_hops: int = 2,
+) -> Dict[str, Any]:
+    """
+    Internal: Build a comprehensive context pack from the knowledge graph.
+    Called by kg_autopilot.
+    """
+    logger.info(f"_context_pack called for project {project_id}")
+    try:
+        builder = get_context_builder()
+        result = await builder.build_context_pack(
+            project_id=project_id,
+            focus_goal_id=focus_goal_id,
+            query=query,
+            k_hops=k_hops,
+        )
+        return serialize_response(result)
+    except Exception as e:
+        logger.error(f"_context_pack failed: {e}")
+        return {
+            "error": str(e),
+            "markdown": f"# Error\n\nFailed to build context: {e}",
+            "entities": {},
+        }
+async def _search(
+    project_id: str,
+    query: str,
+    filters: Optional[List[str]] = None,
+    limit: int = 20,
+) -> Dict[str, Any]:
+    """
+    Internal: Search the knowledge graph using fulltext + traversal.
+    Called by kg_autopilot when search_query is provided.
+    """
+    logger.info(f"_search called: '{query}' in project {project_id}")
+    try:
+        repo = get_repository()
+        results = await repo.fulltext_search(
+            project_id=project_id,
+            query=query,
+            node_types=filters,
+            limit=limit,
+        )
+        return serialize_response({
+            "results": results,
+            "total": len(results),
+            "query": query,
+        })
+    except Exception as e:
+        logger.error(f"_search failed: {e}")
+        return {
+            "error": str(e),
+            "results": [],
+            "total": 0,
+        }
+async def _link_code_artifact(
+    project_id: str,
+    path: str,
+    kind: str = "file",
+    language: Optional[str] = None,
+    symbol_fqn: Optional[str] = None,
+    start_line: Optional[int] = None,
+    end_line: Optional[int] = None,
+    git_commit: Optional[str] = None,
+    content_hash: Optional[str] = None,
+    related_goal_ids: Optional[List[str]] = None,
+) -> Dict[str, Any]:
+    """
+    Internal: Link a code artifact to the knowledge graph.
+    Called by kg_track_changes.
+    """
+    logger.info(f"_link_code_artifact called: {path}")
+    try:
+        repo = get_repository()
+        artifact = await repo.upsert_code_artifact(
+            project_id=project_id,
+            path=path,
+            kind=kind,
+            language=language,
+            symbol_fqn=symbol_fqn,
+            start_line=start_line,
+            end_line=end_line,
+            git_commit=git_commit,
+            content_hash=content_hash,
+            related_goal_ids=related_goal_ids,
+        )
+        return {
+            "artifact_id": artifact.get("id"),
+            "path": path,
+            "linked_goals": len(related_goal_ids) if related_goal_ids else 0,
+        }
+    except Exception as e:
+        logger.error(f"_link_code_artifact failed: {e}")
+        return {
+            "error": str(e),
+            "artifact_id": None,
+        }
+async def _impact_analysis(
+    project_id: str,
+    changed_paths: Optional[List[str]] = None,
+    changed_symbols: Optional[List[str]] = None,
+) -> Dict[str, Any]:
+    """
+    Internal: Analyze the impact of code changes.
+    Called by kg_track_changes when check_impact=True.
+    """
+    logger.info(f"_impact_analysis called for project {project_id}")
+    if not changed_paths and not changed_symbols:
+        return {
+            "error": "At least one of changed_paths or changed_symbols is required",
+            "goals_to_retest": [],
+            "tests_to_run": [],
+            "strategies_to_review": [],
+            "artifacts_related": [],
+        }
+    try:
+        repo = get_repository()
+        paths = changed_paths or []
+        result = await repo.get_impact_for_artifacts(project_id, paths)
+        return serialize_response(result)
+    except Exception as e:
+        logger.error(f"_impact_analysis failed: {e}")
+        return {
+            "error": str(e),
+            "goals_to_retest": [],
+            "tests_to_run": [],
+            "strategies_to_review": [],
+            "artifacts_related": [],
+        }
+# =============================================================================
+# MCP TOOL REGISTRATION (Only 2 tools exposed)
+# =============================================================================
+def register_tools(mcp: FastMCP) -> None:
+    """
+    Register MCP tools with the server.
+    Only 2 tools are exposed:
+    - kg_autopilot: For starting tasks
+    - kg_track_changes: For tracking file modifications
+    """
+    @mcp.tool()
+    async def kg_autopilot(
+        project_id: str,
+        user_text: str,
+        search_query: Optional[str] = None,
+        files: Optional[List[str]] = None,
+        diff: Optional[str] = None,
+        symbols: Optional[List[str]] = None,
+        tags: Optional[List[str]] = None,
+        k_hops: int = 2,
+    ) -> Dict[str, Any]:
+        """
+        🚀 CALL THIS TOOL AT THE START OF EVERY TASK.
+        ⚠️ DO NOT CALL THIS TOOL AFTER CREATING/MODIFYING FILES!
+        Use kg_track_changes instead for file changes.
+        WHEN TO USE THIS TOOL:
+        ✅ Starting a new task or user request
+        ✅ User asks a question (to retrieve past context)
+        ✅ Resuming work on an existing project
+        ✅ Need to understand goals, constraints, preferences
+        WHEN NOT TO USE THIS TOOL:
+        ❌ After creating a file → use kg_track_changes
+        ❌ After modifying a file → use kg_track_changes
+        ❌ To "save" or "record" task completion → NOT NEEDED
+        ❌ To update goal status → NOT SUPPORTED HERE
+        It automatically:
+        1. Ingests and analyzes the user request (extracts goals, constraints, etc.)
+        2. Returns the full context pack with active goals, preferences, pain points
+        3. Optionally searches existing knowledge if search_query is provided
+        Args:
+            project_id: Project identifier (use workspace folder name)
+            user_text: The user's message or request
+            search_query: Optional query to search existing knowledge
+            files: Optional list of file paths involved
+            diff: Optional code diff
+            symbols: Optional list of code symbols
+            tags: Optional tags for categorization
+            k_hops: Graph traversal depth (1-5, default 2)
+        Returns:
+            markdown: Formatted context pack (READ THIS CAREFULLY)
+            interaction_id: ID of the ingested interaction
+            extracted: Extracted entities (goals, constraints, etc.)
+            search_results: Search results if search_query was provided
+        """
+        logger.info(f"kg_autopilot called for project {project_id}")
+        result: Dict[str, Any] = {
+            "markdown": "",
+            "interaction_id": None,
+            "extracted": {},
+            "search_results": [],
+        }
+        try:
+            # Step 1: Ingest the message
+            pipeline = get_ingest_pipeline()
+            ingest_result = await pipeline.process_message(
+                project_id=project_id,
+                user_text=user_text,
+                files=files,
+                diff=diff,
+                symbols=symbols,
+                tags=tags,
+            )
+            result["interaction_id"] = ingest_result.get("interaction_id")
+            result["extracted"] = ingest_result.get("extracted", {})
+            # Step 2: Build context pack
+            builder = get_context_builder()
+            context_result = await builder.build_context_pack(
+                project_id=project_id,
+                query=search_query,
+                k_hops=k_hops,
+            )
+            result["markdown"] = context_result.get("markdown", "")
+            # Add reminder about kg_track_changes
+            result["markdown"] += "\n\n---\n*📝 REMINDER: Call `kg_track_changes` after EVERY file you create or modify to keep the knowledge graph updated.*"
+            result["entities"] = context_result.get("entities", {})
+            # Step 3: Optional search
+            if search_query:
+                repo = get_repository()
+                search_results = await repo.fulltext_search(
+                    project_id=project_id,
+                    query=search_query,
+                    limit=10,
+                )
+                result["search_results"] = search_results
+            return serialize_response(result)
+        except Exception as e:
+            logger.error(f"kg_autopilot failed: {e}")
+            result["error"] = str(e)
+            result["markdown"] = f"# Error\n\nFailed to build context: {e}"
+            return result
+    @mcp.tool()
+    async def kg_track_changes(
+        project_id: str,
+        changes: List[Dict[str, Any]],
+        check_impact: bool = True,
+    ) -> Dict[str, Any]:
+        """
+        🔗 CALL THIS TOOL AFTER EVERY FILE MODIFICATION.
+        ⚠️ DO NOT use kg_autopilot for tracking file changes!
+        ═══════════════════════════════════════════════════════════════════════════
+        REQUIRED INPUT FORMAT
+        ═══════════════════════════════════════════════════════════════════════════
+        Each item in `changes` must be a dict with this structure:
+        {
+            "path": "/absolute/path/to/file.py",              # REQUIRED
+            "change_type": "created" | "modified" | "deleted", # REQUIRED
+            "language": "python",                             # Optional, auto-detected
+            "symbols": [                                      # Optional but RECOMMENDED
+                {
+                    "name": "function_name",                  # e.g. "calculate_tax"
+                    "kind": "function" | "method" | "class",  # REQUIRED
+                    "line_start": 10,                         # REQUIRED
+                    "line_end": 25,                           # REQUIRED
+                    "signature": "def calculate_tax(...)",    # Optional
+                    "change_type": "added" | "modified" | "deleted"  # REQUIRED
+                }
+            ]
+        }
+        ═══════════════════════════════════════════════════════════════════════════
+        EXAMPLE CALLS
+        ═══════════════════════════════════════════════════════════════════════════
+        Example 1 - Creating a new file with a function:
+        ```
+        kg_track_changes(
+            project_id="my-project",
+            changes=[{
+                "path": "/project/src/utils.py",
+                "change_type": "created",
+                "symbols": [{
+                    "name": "format_currency",
+                    "kind": "function",
+                    "line_start": 1,
+                    "line_end": 15,
+                    "signature": "def format_currency(amount: float, currency: str = 'EUR') -> str",
+                    "change_type": "added"
+                }]
+            }]
+        )
+        ```
+        Example 2 - Modifying a class method:
+        ```
+        kg_track_changes(
+            project_id="my-project",
+            changes=[{
+                "path": "/project/src/services/auth.py",
+                "change_type": "modified",
+                "symbols": [{
+                    "name": "AuthService.validate_token",
+                    "kind": "method",
+                    "line_start": 45,
+                    "line_end": 78,
+                    "signature": "async def validate_token(self, token: str) -> bool",
+                    "change_type": "modified"
+                }]
+            }]
+        )
+        ```
+        Example 3 - Simple file tracking (no symbols):
+        ```
+        kg_track_changes(
+            project_id="my-project",
+            changes=[{"path": "/project/README.md", "change_type": "modified"}]
+        )
+        ```
+        ═══════════════════════════════════════════════════════════════════════════
+        WHAT THIS TOOL DOES
+        ═══════════════════════════════════════════════════════════════════════════
+        1. Creates/updates CodeArtifact node for each file
+        2. Creates Symbol nodes for each symbol, linked via CONTAINS relationship
+        3. AUTO-LINKS to ALL active goals (no need to specify goal IDs!)
+        4. Stores line ranges and signatures for semantic queries
+        5. Runs impact analysis to find affected tests/strategies
+        ═══════════════════════════════════════════════════════════════════════════
+        Args:
+            project_id: Project identifier (use workspace folder name)
+            changes: List of file changes with optional symbols (see format above)
+            check_impact: Whether to run impact analysis (default: True)
+        Returns:
+            artifacts_linked: Number of files tracked
+            symbols_linked: Number of symbols tracked
+            auto_linked_goals: Goals automatically linked
+            impact_analysis: Affected tests and strategies
+        """
+        logger.info(f"kg_track_changes called for {len(changes)} files")
+        if not changes:
+            return {
+                "error": "changes is required and cannot be empty",
+                "artifacts_linked": 0,
+                "symbols_linked": 0,
+                "impact_analysis": {},
+            }
+        result: Dict[str, Any] = {
+            "artifacts_linked": 0,
+            "symbols_linked": 0,
+            "linked_paths": [],
+            "linked_symbols": [],
+            "auto_linked_goals": [],
+            "impact_analysis": {},
+        }
+        try:
+            repo = get_repository()
+            # Step 1: Auto-link to active goals
+            try:
+                active_goals = await repo.get_active_goals(project_id)
+                related_goal_ids = [g["id"] for g in active_goals if g.get("id")]
+                result["auto_linked_goals"] = [
+                    {"id": g["id"], "title": g.get("title", "Unknown")}
+                    for g in active_goals if g.get("id")
+                ]
+                logger.info(f"Auto-linking to {len(related_goal_ids)} active goals")
+            except Exception as goal_error:
+                logger.warning(f"Could not fetch active goals: {goal_error}")
+                related_goal_ids = []
+            # Step 2: Process each file change
+            all_paths = []
+            for change in changes:
+                path = change.get("path")
+                if not path:
+                    logger.warning("Skipping change without path")
+                    continue
+                all_paths.append(path)
+                change_type = change.get("change_type", "modified")
+                language = change.get("language")
+                symbols = change.get("symbols", [])
+                try:
+                    # Create/update CodeArtifact
+                    artifact = await repo.upsert_code_artifact(
+                        project_id=project_id,
+                        path=path,
+                        kind="file",
+                        language=language,
+                        related_goal_ids=related_goal_ids,
+                    )
+                    artifact_id = artifact.get("id")
+                    result["artifacts_linked"] += 1
+                    result["linked_paths"].append(path)
+                    # Create symbols if provided
+                    if artifact_id and symbols:
+                        for sym in symbols:
+                            sym_name = sym.get("name")
+                            if not sym_name:
+                                continue
+                            # Generate FQN: path:symbol_name
+                            fqn = f"{path}:{sym_name}"
+                            await repo.upsert_symbol(
+                                artifact_id=artifact_id,
+                                fqn=fqn,
+                                name=sym_name,
+                                kind=sym.get("kind", "function"),
+                                line_start=sym.get("line_start"),
+                                line_end=sym.get("line_end"),
+                                signature=sym.get("signature"),
+                                change_type=sym.get("change_type", "modified"),
+                            )
+                            result["symbols_linked"] += 1
+                            result["linked_symbols"].append({
+                                "fqn": fqn,
+                                "name": sym_name,
+                                "kind": sym.get("kind"),
+                                "lines": f"{sym.get('line_start')}-{sym.get('line_end')}",
+                            })
+                except Exception as link_error:
+                    logger.warning(f"Failed to link {path}: {link_error}")
+            # Step 3: Impact analysis
+            if check_impact and all_paths:
+                impact = await repo.get_impact_for_artifacts(project_id, all_paths)
+                result["impact_analysis"] = impact
+            return serialize_response(result)
+        except Exception as e:
+            logger.error(f"kg_track_changes failed: {e}")
+            result["error"] = str(e)
+            return result
+    logger.info("MCP tools registered: kg_autopilot, kg_track_changes (2 tools only)")

kg_mcp/security/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""
+Security submodule for authentication and authorization.
+"""

kg_mcp/security/auth.py ADDED Viewed

@@ -0,0 +1,121 @@
+"""
+Authentication middleware for MCP server.
+Validates Bearer tokens for incoming requests.
+"""
+import logging
+from typing import Callable, Optional
+from kg_mcp.config import get_settings
+logger = logging.getLogger(__name__)
+class AuthenticationError(Exception):
+    """Raised when authentication fails."""
+    pass
+def validate_bearer_token(token: str) -> bool:
+    """
+    Validate a bearer token against the configured token.
+    Args:
+        token: The token to validate
+    Returns:
+        True if valid, False otherwise
+    """
+    settings = get_settings()
+    if not settings.kg_mcp_token:
+        # No token configured - authentication disabled
+        logger.warning("No authentication token configured - all requests allowed")
+        return True
+    return token == settings.kg_mcp_token
+def extract_bearer_token(authorization_header: Optional[str]) -> Optional[str]:
+    """
+    Extract the bearer token from an Authorization header.
+    Args:
+        authorization_header: The full Authorization header value
+    Returns:
+        The token if present and properly formatted, None otherwise
+    """
+    if not authorization_header:
+        return None
+    parts = authorization_header.split()
+    if len(parts) != 2:
+        return None
+    scheme, token = parts
+    if scheme.lower() != "bearer":
+        return None
+    return token
+def create_auth_middleware() -> Callable:
+    """
+    Create an authentication middleware function.
+    Returns:
+        A middleware function that validates requests
+    """
+    async def auth_middleware(request, call_next):
+        """Middleware to check authentication on all requests."""
+        settings = get_settings()
+        # Skip auth if no token configured
+        if not settings.kg_mcp_token:
+            return await call_next(request)
+        # Extract and validate token
+        auth_header = request.headers.get("authorization")
+        token = extract_bearer_token(auth_header)
+        if not token:
+            logger.warning(f"Missing or invalid Authorization header from {request.client.host}")
+            # Return 401 Unauthorized
+            from starlette.responses import JSONResponse
+            return JSONResponse(
+                status_code=401,
+                content={"error": "Missing or invalid Authorization header"},
+            )
+        if not validate_bearer_token(token):
+            logger.warning(f"Invalid token from {request.client.host}")
+            return JSONResponse(
+                status_code=403,
+                content={"error": "Invalid authentication token"},
+            )
+        return await call_next(request)
+    return auth_middleware
+def require_auth(func: Callable) -> Callable:
+    """
+    Decorator to require authentication for a function.
+    This is a simple decorator for individual functions,
+    not for use with the full middleware system.
+    """
+    import functools
+    @functools.wraps(func)
+    async def wrapper(*args, **kwargs):
+        # In the context of MCP tools, auth is handled at the transport level
+        # This decorator is a placeholder for additional auth checks if needed
+        return await func(*args, **kwargs)
+    return wrapper