roma-debug 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
roma_debug/__init__.py ADDED
@@ -0,0 +1,3 @@
1
+ """ROMA Debug - Standalone CLI debugging tool."""
2
+
3
+ __version__ = "0.1.0"
roma_debug/config.py ADDED
@@ -0,0 +1,79 @@
1
+ """Centralized configuration for ROMA Debug.
2
+
3
+ This module is the single source of truth for all configuration.
4
+ It loads the .env file once at import time and exposes validated settings.
5
+ """
6
+
7
+ import os
8
+ from pathlib import Path
9
+
10
+ from dotenv import load_dotenv
11
+
12
+
13
+ def _find_project_root() -> Path:
14
+ """Find project root by searching for .env file.
15
+
16
+ Searches upward from this file's location until .env is found.
17
+ Falls back to the parent of roma_debug package.
18
+
19
+ Returns:
20
+ Path to project root directory
21
+ """
22
+ current = Path(__file__).resolve().parent
23
+
24
+ # Search upward for .env file (max 5 levels)
25
+ for _ in range(5):
26
+ if (current / ".env").exists():
27
+ return current
28
+ if current.parent == current:
29
+ break
30
+ current = current.parent
31
+
32
+ # Fallback: assume project root is parent of roma_debug/
33
+ return Path(__file__).resolve().parent.parent
34
+
35
+
36
def _load_config() -> str:
    """Load configuration from the .env file.

    Locates the project root, loads its .env (if present) into the
    process environment, then reads the API key.

    Returns:
        The Gemini API key

    Raises:
        RuntimeError: If GEMINI_API_KEY is not set
    """
    project_root = _find_project_root()
    env_path = project_root / ".env"

    # Load .env file; override=True so the file wins over stale env vars.
    if env_path.exists():
        load_dotenv(env_path, override=True)
    else:
        # Try loading from python-dotenv's default search locations anyway.
        load_dotenv()

    # GOOGLE_API_KEY is accepted as a fallback alias for convenience.
    api_key = os.environ.get("GEMINI_API_KEY") or os.environ.get("GOOGLE_API_KEY")

    if not api_key:
        # Fix: the first and last lines had an `f` prefix but no
        # placeholders (lint F541); only the middle line interpolates.
        raise RuntimeError(
            "GEMINI_API_KEY not found!\n"
            f"Searched .env at: {env_path}\n"
            "Please set GEMINI_API_KEY in your .env file or environment."
        )

    return api_key
66
+
67
+
68
# Load configuration at import time.
# This ensures consistent behavior across CLI and server: any import of
# this module fails fast with a clear RuntimeError when no key is set.
GEMINI_API_KEY: str = _load_config()
71
+
72
+
73
def get_api_key_status() -> str:
    """Get human-readable API key status for logging.

    Returns:
        'OK' if key is loaded, 'MISSING' otherwise
    """
    if GEMINI_API_KEY:
        return "OK"
    return "MISSING"
roma_debug/core/__init__.py ADDED
@@ -0,0 +1,5 @@
1
+ """Core modules for ROMA Debug."""
2
+
3
+ from roma_debug.core.engine import analyze_error
4
+
5
+ __all__ = ["analyze_error"]
roma_debug/core/engine.py ADDED
@@ -0,0 +1,423 @@
1
+ """Gemini Fixer Logic for ROMA Debug.
2
+
3
+ Returns structured JSON responses for machine-readable fixes.
4
+ Supports both V1 (simple) and V2 (deep debugging) modes.
5
+ """
6
+
7
+ import json
8
+ import re
9
+ import time
10
+ from dataclasses import dataclass, field
11
+ from typing import Optional, List
12
+
13
+ from google import genai
14
+ from google.genai import types
15
+
16
+ from roma_debug.config import GEMINI_API_KEY
17
+ from roma_debug.prompts import SYSTEM_PROMPT, SYSTEM_PROMPT_V2
18
+
19
+
20
# Model priority: try Lite first (higher quota), then Flash.
PRIMARY_MODEL = "gemini-2.5-flash-lite"
FALLBACK_MODEL = "gemini-2.5-flash"

# Placeholder paths that indicate the AI couldn't determine the real path.
# Membership is tested against the lower-cased candidate in
# _normalize_filepath, so entries here must stay lower-case.
INVALID_PATHS = {
    "unknown",
    "path/to/file.py",
    "path/to/your/code.py",
    "path/to/your/file.py",
    "example.py",
    "your_file.py",
    "file.py",
    "",
}
35
+
36
+
37
@dataclass
class FixResult:
    """Structured result from the AI engine.

    Holds the parsed fix plus the raw model output for debugging.
    """
    filepath: Optional[str]  # None for general system errors
    full_code_block: str
    explanation: str
    raw_response: str
    model_used: str

    def to_dict(self) -> dict:
        """Serialize the fix payload (raw_response/model_used are omitted)."""
        public_keys = ("filepath", "full_code_block", "explanation")
        return {key: getattr(self, key) for key in public_keys}
53
+
54
+
55
@dataclass
class AdditionalFix:
    """An additional fix for another file.

    Produced during V2 analysis when the model reports fixes beyond the
    primary file (see analyze_error_v2's "additional_fixes" parsing).
    """
    filepath: str
    full_code_block: str
    explanation: str
61
+
62
+
63
@dataclass
class FixResultV2(FixResult):
    """V2 result with root cause analysis and multiple fixes."""
    root_cause_file: Optional[str] = None
    root_cause_explanation: Optional[str] = None
    additional_fixes: List[AdditionalFix] = field(default_factory=list)

    def to_dict(self) -> dict:
        """Serialize, extending the V1 payload with root-cause data."""
        data = super().to_dict()
        data["root_cause_file"] = self.root_cause_file
        data["root_cause_explanation"] = self.root_cause_explanation
        data["additional_fixes"] = [
            {
                "filepath": extra.filepath,
                "full_code_block": extra.full_code_block,
                "explanation": extra.explanation,
            }
            for extra in self.additional_fixes
        ]
        return data

    @property
    def has_root_cause(self) -> bool:
        """True when a root cause in a *different* file was identified."""
        if not self.root_cause_file:
            return False
        return self.root_cause_file != self.filepath

    @property
    def all_files_to_fix(self) -> List[str]:
        """All files needing fixes, de-duplicated, primary file first."""
        ordered: List[str] = []
        if self.filepath:
            ordered.append(self.filepath)
        if self.root_cause_file and self.root_cause_file not in ordered:
            ordered.append(self.root_cause_file)
        for extra in self.additional_fixes:
            if extra.filepath not in ordered:
                ordered.append(extra.filepath)
        return ordered
102
+
103
+
104
def _get_client() -> genai.Client:
    """Build a Gemini client configured with the module-level API key.

    A fresh client is created per call; no connection state is cached here.
    """
    return genai.Client(api_key=GEMINI_API_KEY)
107
+
108
+
109
+ def _normalize_filepath(filepath: Optional[str]) -> Optional[str]:
110
+ """Normalize filepath, returning None for invalid/placeholder paths.
111
+
112
+ Args:
113
+ filepath: Raw filepath from AI response
114
+
115
+ Returns:
116
+ Validated filepath or None if invalid
117
+ """
118
+ if filepath is None:
119
+ return None
120
+
121
+ # Convert to string and strip whitespace
122
+ filepath = str(filepath).strip()
123
+
124
+ # Check against known invalid placeholders
125
+ if filepath.lower() in INVALID_PATHS:
126
+ return None
127
+
128
+ # Check for placeholder patterns
129
+ placeholder_patterns = [
130
+ r"^path/to/",
131
+ r"^your[_-]",
132
+ r"^example[_-]?",
133
+ r"<.*>", # <filename> style placeholders
134
+ ]
135
+ for pattern in placeholder_patterns:
136
+ if re.match(pattern, filepath, re.IGNORECASE):
137
+ return None
138
+
139
+ return filepath
140
+
141
+
142
+ def _parse_json_response(text: str) -> dict:
143
+ """Parse JSON from response, handling markdown code blocks.
144
+
145
+ Args:
146
+ text: Raw response text
147
+
148
+ Returns:
149
+ Parsed JSON dict
150
+
151
+ Raises:
152
+ ValueError: If JSON parsing fails
153
+ """
154
+ # Try direct JSON parse first
155
+ try:
156
+ return json.loads(text)
157
+ except json.JSONDecodeError:
158
+ pass
159
+
160
+ # Try extracting from markdown code block
161
+ json_match = re.search(r'```(?:json)?\s*\n?(.*?)\n?```', text, re.DOTALL)
162
+ if json_match:
163
+ try:
164
+ return json.loads(json_match.group(1))
165
+ except json.JSONDecodeError:
166
+ pass
167
+
168
+ # Try finding JSON object in text
169
+ json_match = re.search(r'\{[\s\S]*\}', text)
170
+ if json_match:
171
+ try:
172
+ return json.loads(json_match.group(0))
173
+ except json.JSONDecodeError:
174
+ pass
175
+
176
+ raise ValueError(f"Could not parse JSON from response: {text[:200]}...")
177
+
178
+
179
def analyze_error(log: str, context: str, max_retries: int = 3) -> FixResult:
    """Analyze an error log and return a structured code fix.

    Strategy: call PRIMARY_MODEL first; on a quota/rate-limit error switch
    to FALLBACK_MODEL, which is retried with exponential backoff. Any
    non-quota error is re-raised immediately without trying the fallback.

    Args:
        log: The error log or traceback
        context: Source code context around the error
        max_retries: Number of retries for rate limit errors

    Returns:
        FixResult with structured fix data (filepath may be None for general errors)

    Raises:
        Exception: If Gemini API call fails after retries
    """
    client = _get_client()

    user_prompt = _build_prompt(log, context)
    full_prompt = f"{SYSTEM_PROMPT}\n\n{user_prompt}"

    # Configure for JSON output; temperature 0 for deterministic fixes.
    generation_config = types.GenerateContentConfig(
        temperature=0,
        response_mime_type="application/json",
    )

    models_to_try = [PRIMARY_MODEL, FALLBACK_MODEL]
    last_error = None

    for model_name in models_to_try:
        for attempt in range(max_retries):
            try:
                response = client.models.generate_content(
                    model=model_name,
                    contents=full_prompt,
                    config=generation_config,
                )

                raw_text = response.text

                # Parse JSON response; fall back to a minimal structure so
                # the caller still receives the raw model output.
                try:
                    parsed = _parse_json_response(raw_text)
                except ValueError:
                    # If JSON parsing fails, create a basic structure
                    parsed = {
                        "filepath": None,
                        "full_code_block": raw_text,
                        "explanation": "AI returned non-JSON response. Raw output provided.",
                    }

                # Normalize and validate filepath (placeholder paths -> None)
                raw_filepath = parsed.get("filepath")
                normalized_filepath = _normalize_filepath(raw_filepath)

                return FixResult(
                    filepath=normalized_filepath,
                    full_code_block=parsed.get("full_code_block", ""),
                    explanation=parsed.get("explanation", ""),
                    raw_response=raw_text,
                    model_used=model_name,
                )

            except Exception as e:
                error_str = str(e).lower()
                last_error = e

                # Heuristic: quota errors are detected by substring match
                # on the exception text (no SDK-specific exception types).
                is_quota_error = any(x in error_str for x in [
                    "429", "quota", "rate limit", "resource exhausted"
                ])

                if is_quota_error:
                    if model_name == PRIMARY_MODEL:
                        break  # Try fallback model

                    # Fallback model: exponential backoff (5s, 10s, 20s, ...)
                    wait_time = (2 ** attempt) * 5
                    if attempt < max_retries - 1:
                        time.sleep(wait_time)
                        continue

                # Non-quota errors (and the final quota-limited attempt on
                # the fallback model) propagate to the caller immediately.
                raise

        # Primary model broke out due to a quota error: try the fallback.
        if model_name == PRIMARY_MODEL and last_error:
            continue

        # NOTE(review): for the fallback model every failing attempt
        # re-raises inside the loop, so this line appears unreachable in
        # practice — confirm before relying on it.
        raise last_error
264
+
265
+
266
def analyze_error_v2(
    log: str,
    context: str,
    max_retries: int = 3,
    include_upstream: bool = True,
) -> FixResultV2:
    """Analyze an error with V2 deep debugging (root cause analysis).

    Mirrors analyze_error's model-fallback/retry strategy, but uses the
    V2 prompt and parses root-cause fields plus additional per-file fixes.

    Args:
        log: The error log or traceback
        context: Source code context (should include upstream context for V2)
        max_retries: Number of retries for rate limit errors
        include_upstream: Whether upstream context was included.
            NOTE(review): this flag is not referenced in the body —
            confirm whether it is informational only.

    Returns:
        FixResultV2 with root cause analysis and potentially multiple fixes

    Raises:
        Exception: If Gemini API call fails after retries
    """
    client = _get_client()

    user_prompt = _build_prompt_v2(log, context)
    full_prompt = f"{SYSTEM_PROMPT_V2}\n\n{user_prompt}"

    # Configure for JSON output; temperature 0 for deterministic fixes.
    generation_config = types.GenerateContentConfig(
        temperature=0,
        response_mime_type="application/json",
    )

    models_to_try = [PRIMARY_MODEL, FALLBACK_MODEL]
    last_error = None

    for model_name in models_to_try:
        for attempt in range(max_retries):
            try:
                response = client.models.generate_content(
                    model=model_name,
                    contents=full_prompt,
                    config=generation_config,
                )

                raw_text = response.text

                # Parse JSON response; fall back to a minimal structure so
                # the caller still receives the raw model output.
                try:
                    parsed = _parse_json_response(raw_text)
                except ValueError:
                    # If JSON parsing fails, create a basic structure
                    parsed = {
                        "filepath": None,
                        "full_code_block": raw_text,
                        "explanation": "AI returned non-JSON response. Raw output provided.",
                    }

                # Normalize filepaths (placeholder paths -> None)
                normalized_filepath = _normalize_filepath(parsed.get("filepath"))
                root_cause_file = _normalize_filepath(parsed.get("root_cause_file"))

                # Parse additional fixes; entries whose filepath normalizes
                # to None (placeholders) are silently dropped.
                additional_fixes = []
                for fix_data in parsed.get("additional_fixes", []):
                    fix_path = _normalize_filepath(fix_data.get("filepath"))
                    if fix_path:
                        additional_fixes.append(AdditionalFix(
                            filepath=fix_path,
                            full_code_block=fix_data.get("full_code_block", ""),
                            explanation=fix_data.get("explanation", ""),
                        ))

                return FixResultV2(
                    filepath=normalized_filepath,
                    full_code_block=parsed.get("full_code_block", ""),
                    explanation=parsed.get("explanation", ""),
                    raw_response=raw_text,
                    model_used=model_name,
                    root_cause_file=root_cause_file,
                    root_cause_explanation=parsed.get("root_cause_explanation"),
                    additional_fixes=additional_fixes,
                )

            except Exception as e:
                error_str = str(e).lower()
                last_error = e

                # Heuristic: quota errors are detected by substring match
                # on the exception text (no SDK-specific exception types).
                is_quota_error = any(x in error_str for x in [
                    "429", "quota", "rate limit", "resource exhausted"
                ])

                if is_quota_error:
                    if model_name == PRIMARY_MODEL:
                        break  # Try fallback model

                    # Fallback model: exponential backoff (5s, 10s, 20s, ...)
                    wait_time = (2 ** attempt) * 5
                    if attempt < max_retries - 1:
                        time.sleep(wait_time)
                        continue

                # Non-quota errors (and the final quota-limited attempt on
                # the fallback model) propagate to the caller immediately.
                raise

        # Primary model broke out due to a quota error: try the fallback.
        if model_name == PRIMARY_MODEL and last_error:
            continue

        # NOTE(review): for the fallback model every failing attempt
        # re-raises inside the loop, so this line appears unreachable in
        # practice — confirm before relying on it.
        raise last_error
371
+
372
+
373
def analyze_error_simple(log: str, context: str, max_retries: int = 3) -> str:
    """Analyze error and return raw text (for backward compatibility).

    Thin wrapper over analyze_error() that discards the structured fields
    and returns only the code text.

    Args:
        log: The error log or traceback
        context: Source code context around the error
        max_retries: Number of retries for rate limit errors

    Returns:
        Raw text fix from Gemini
    """
    fix = analyze_error(log, context, max_retries)
    if fix.full_code_block:
        return fix.full_code_block
    return fix.raw_response
386
+
387
+
388
+ def _build_prompt(log: str, context: str) -> str:
389
+ """Build the user prompt from log and context."""
390
+ parts = ["## ERROR LOG", log]
391
+
392
+ if context:
393
+ parts.extend(["", "## SOURCE CONTEXT", context])
394
+
395
+ parts.extend([
396
+ "",
397
+ "## INSTRUCTIONS",
398
+ "Analyze the error above. Return the corrected code as JSON.",
399
+ "The full_code_block should contain the complete fixed code, ready to replace the original.",
400
+ "If no specific file path is in the error traceback, set filepath to null.",
401
+ ])
402
+
403
+ return "\n".join(parts)
404
+
405
+
406
+ def _build_prompt_v2(log: str, context: str) -> str:
407
+ """Build V2 prompt with upstream context support."""
408
+ parts = ["## ERROR LOG / TRACEBACK", log]
409
+
410
+ if context:
411
+ parts.extend(["", context]) # Context already formatted by ContextBuilder
412
+
413
+ parts.extend([
414
+ "",
415
+ "## INSTRUCTIONS",
416
+ "Analyze the error above with deep project understanding.",
417
+ "Consider the full call chain and upstream context to identify root causes.",
418
+ "Return the corrected code as JSON with root cause analysis if applicable.",
419
+ "If the bug originates in a different file, set root_cause_file and provide fixes for both.",
420
+ "If no specific file path is in the traceback, set filepath to null.",
421
+ ])
422
+
423
+ return "\n".join(parts)