tree-sitter-analyzer 1.9.17.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (149)
  1. tree_sitter_analyzer/__init__.py +132 -0
  2. tree_sitter_analyzer/__main__.py +11 -0
  3. tree_sitter_analyzer/api.py +853 -0
  4. tree_sitter_analyzer/cli/__init__.py +39 -0
  5. tree_sitter_analyzer/cli/__main__.py +12 -0
  6. tree_sitter_analyzer/cli/argument_validator.py +89 -0
  7. tree_sitter_analyzer/cli/commands/__init__.py +26 -0
  8. tree_sitter_analyzer/cli/commands/advanced_command.py +226 -0
  9. tree_sitter_analyzer/cli/commands/base_command.py +181 -0
  10. tree_sitter_analyzer/cli/commands/default_command.py +18 -0
  11. tree_sitter_analyzer/cli/commands/find_and_grep_cli.py +188 -0
  12. tree_sitter_analyzer/cli/commands/list_files_cli.py +133 -0
  13. tree_sitter_analyzer/cli/commands/partial_read_command.py +139 -0
  14. tree_sitter_analyzer/cli/commands/query_command.py +109 -0
  15. tree_sitter_analyzer/cli/commands/search_content_cli.py +161 -0
  16. tree_sitter_analyzer/cli/commands/structure_command.py +156 -0
  17. tree_sitter_analyzer/cli/commands/summary_command.py +116 -0
  18. tree_sitter_analyzer/cli/commands/table_command.py +414 -0
  19. tree_sitter_analyzer/cli/info_commands.py +124 -0
  20. tree_sitter_analyzer/cli_main.py +472 -0
  21. tree_sitter_analyzer/constants.py +85 -0
  22. tree_sitter_analyzer/core/__init__.py +15 -0
  23. tree_sitter_analyzer/core/analysis_engine.py +580 -0
  24. tree_sitter_analyzer/core/cache_service.py +333 -0
  25. tree_sitter_analyzer/core/engine.py +585 -0
  26. tree_sitter_analyzer/core/parser.py +293 -0
  27. tree_sitter_analyzer/core/query.py +605 -0
  28. tree_sitter_analyzer/core/query_filter.py +200 -0
  29. tree_sitter_analyzer/core/query_service.py +340 -0
  30. tree_sitter_analyzer/encoding_utils.py +530 -0
  31. tree_sitter_analyzer/exceptions.py +747 -0
  32. tree_sitter_analyzer/file_handler.py +246 -0
  33. tree_sitter_analyzer/formatters/__init__.py +1 -0
  34. tree_sitter_analyzer/formatters/base_formatter.py +201 -0
  35. tree_sitter_analyzer/formatters/csharp_formatter.py +367 -0
  36. tree_sitter_analyzer/formatters/formatter_config.py +197 -0
  37. tree_sitter_analyzer/formatters/formatter_factory.py +84 -0
  38. tree_sitter_analyzer/formatters/formatter_registry.py +377 -0
  39. tree_sitter_analyzer/formatters/formatter_selector.py +96 -0
  40. tree_sitter_analyzer/formatters/go_formatter.py +368 -0
  41. tree_sitter_analyzer/formatters/html_formatter.py +498 -0
  42. tree_sitter_analyzer/formatters/java_formatter.py +423 -0
  43. tree_sitter_analyzer/formatters/javascript_formatter.py +611 -0
  44. tree_sitter_analyzer/formatters/kotlin_formatter.py +268 -0
  45. tree_sitter_analyzer/formatters/language_formatter_factory.py +123 -0
  46. tree_sitter_analyzer/formatters/legacy_formatter_adapters.py +228 -0
  47. tree_sitter_analyzer/formatters/markdown_formatter.py +725 -0
  48. tree_sitter_analyzer/formatters/php_formatter.py +301 -0
  49. tree_sitter_analyzer/formatters/python_formatter.py +830 -0
  50. tree_sitter_analyzer/formatters/ruby_formatter.py +278 -0
  51. tree_sitter_analyzer/formatters/rust_formatter.py +233 -0
  52. tree_sitter_analyzer/formatters/sql_formatter_wrapper.py +689 -0
  53. tree_sitter_analyzer/formatters/sql_formatters.py +536 -0
  54. tree_sitter_analyzer/formatters/typescript_formatter.py +543 -0
  55. tree_sitter_analyzer/formatters/yaml_formatter.py +462 -0
  56. tree_sitter_analyzer/interfaces/__init__.py +9 -0
  57. tree_sitter_analyzer/interfaces/cli.py +535 -0
  58. tree_sitter_analyzer/interfaces/cli_adapter.py +359 -0
  59. tree_sitter_analyzer/interfaces/mcp_adapter.py +224 -0
  60. tree_sitter_analyzer/interfaces/mcp_server.py +428 -0
  61. tree_sitter_analyzer/language_detector.py +553 -0
  62. tree_sitter_analyzer/language_loader.py +271 -0
  63. tree_sitter_analyzer/languages/__init__.py +10 -0
  64. tree_sitter_analyzer/languages/csharp_plugin.py +1076 -0
  65. tree_sitter_analyzer/languages/css_plugin.py +449 -0
  66. tree_sitter_analyzer/languages/go_plugin.py +836 -0
  67. tree_sitter_analyzer/languages/html_plugin.py +496 -0
  68. tree_sitter_analyzer/languages/java_plugin.py +1299 -0
  69. tree_sitter_analyzer/languages/javascript_plugin.py +1622 -0
  70. tree_sitter_analyzer/languages/kotlin_plugin.py +656 -0
  71. tree_sitter_analyzer/languages/markdown_plugin.py +1928 -0
  72. tree_sitter_analyzer/languages/php_plugin.py +862 -0
  73. tree_sitter_analyzer/languages/python_plugin.py +1636 -0
  74. tree_sitter_analyzer/languages/ruby_plugin.py +757 -0
  75. tree_sitter_analyzer/languages/rust_plugin.py +673 -0
  76. tree_sitter_analyzer/languages/sql_plugin.py +2444 -0
  77. tree_sitter_analyzer/languages/typescript_plugin.py +1892 -0
  78. tree_sitter_analyzer/languages/yaml_plugin.py +695 -0
  79. tree_sitter_analyzer/legacy_table_formatter.py +860 -0
  80. tree_sitter_analyzer/mcp/__init__.py +34 -0
  81. tree_sitter_analyzer/mcp/resources/__init__.py +43 -0
  82. tree_sitter_analyzer/mcp/resources/code_file_resource.py +208 -0
  83. tree_sitter_analyzer/mcp/resources/project_stats_resource.py +586 -0
  84. tree_sitter_analyzer/mcp/server.py +869 -0
  85. tree_sitter_analyzer/mcp/tools/__init__.py +28 -0
  86. tree_sitter_analyzer/mcp/tools/analyze_scale_tool.py +779 -0
  87. tree_sitter_analyzer/mcp/tools/analyze_scale_tool_cli_compatible.py +291 -0
  88. tree_sitter_analyzer/mcp/tools/base_tool.py +139 -0
  89. tree_sitter_analyzer/mcp/tools/fd_rg_utils.py +816 -0
  90. tree_sitter_analyzer/mcp/tools/find_and_grep_tool.py +686 -0
  91. tree_sitter_analyzer/mcp/tools/list_files_tool.py +413 -0
  92. tree_sitter_analyzer/mcp/tools/output_format_validator.py +148 -0
  93. tree_sitter_analyzer/mcp/tools/query_tool.py +443 -0
  94. tree_sitter_analyzer/mcp/tools/read_partial_tool.py +464 -0
  95. tree_sitter_analyzer/mcp/tools/search_content_tool.py +836 -0
  96. tree_sitter_analyzer/mcp/tools/table_format_tool.py +572 -0
  97. tree_sitter_analyzer/mcp/tools/universal_analyze_tool.py +653 -0
  98. tree_sitter_analyzer/mcp/utils/__init__.py +113 -0
  99. tree_sitter_analyzer/mcp/utils/error_handler.py +569 -0
  100. tree_sitter_analyzer/mcp/utils/file_output_factory.py +217 -0
  101. tree_sitter_analyzer/mcp/utils/file_output_manager.py +322 -0
  102. tree_sitter_analyzer/mcp/utils/gitignore_detector.py +358 -0
  103. tree_sitter_analyzer/mcp/utils/path_resolver.py +414 -0
  104. tree_sitter_analyzer/mcp/utils/search_cache.py +343 -0
  105. tree_sitter_analyzer/models.py +840 -0
  106. tree_sitter_analyzer/mypy_current_errors.txt +2 -0
  107. tree_sitter_analyzer/output_manager.py +255 -0
  108. tree_sitter_analyzer/platform_compat/__init__.py +3 -0
  109. tree_sitter_analyzer/platform_compat/adapter.py +324 -0
  110. tree_sitter_analyzer/platform_compat/compare.py +224 -0
  111. tree_sitter_analyzer/platform_compat/detector.py +67 -0
  112. tree_sitter_analyzer/platform_compat/fixtures.py +228 -0
  113. tree_sitter_analyzer/platform_compat/profiles.py +217 -0
  114. tree_sitter_analyzer/platform_compat/record.py +55 -0
  115. tree_sitter_analyzer/platform_compat/recorder.py +155 -0
  116. tree_sitter_analyzer/platform_compat/report.py +92 -0
  117. tree_sitter_analyzer/plugins/__init__.py +280 -0
  118. tree_sitter_analyzer/plugins/base.py +647 -0
  119. tree_sitter_analyzer/plugins/manager.py +384 -0
  120. tree_sitter_analyzer/project_detector.py +328 -0
  121. tree_sitter_analyzer/queries/__init__.py +27 -0
  122. tree_sitter_analyzer/queries/csharp.py +216 -0
  123. tree_sitter_analyzer/queries/css.py +615 -0
  124. tree_sitter_analyzer/queries/go.py +275 -0
  125. tree_sitter_analyzer/queries/html.py +543 -0
  126. tree_sitter_analyzer/queries/java.py +402 -0
  127. tree_sitter_analyzer/queries/javascript.py +724 -0
  128. tree_sitter_analyzer/queries/kotlin.py +192 -0
  129. tree_sitter_analyzer/queries/markdown.py +258 -0
  130. tree_sitter_analyzer/queries/php.py +95 -0
  131. tree_sitter_analyzer/queries/python.py +859 -0
  132. tree_sitter_analyzer/queries/ruby.py +92 -0
  133. tree_sitter_analyzer/queries/rust.py +223 -0
  134. tree_sitter_analyzer/queries/sql.py +555 -0
  135. tree_sitter_analyzer/queries/typescript.py +871 -0
  136. tree_sitter_analyzer/queries/yaml.py +236 -0
  137. tree_sitter_analyzer/query_loader.py +272 -0
  138. tree_sitter_analyzer/security/__init__.py +22 -0
  139. tree_sitter_analyzer/security/boundary_manager.py +277 -0
  140. tree_sitter_analyzer/security/regex_checker.py +297 -0
  141. tree_sitter_analyzer/security/validator.py +599 -0
  142. tree_sitter_analyzer/table_formatter.py +782 -0
  143. tree_sitter_analyzer/utils/__init__.py +53 -0
  144. tree_sitter_analyzer/utils/logging.py +433 -0
  145. tree_sitter_analyzer/utils/tree_sitter_compat.py +289 -0
  146. tree_sitter_analyzer-1.9.17.1.dist-info/METADATA +485 -0
  147. tree_sitter_analyzer-1.9.17.1.dist-info/RECORD +149 -0
  148. tree_sitter_analyzer-1.9.17.1.dist-info/WHEEL +4 -0
  149. tree_sitter_analyzer-1.9.17.1.dist-info/entry_points.txt +25 -0
@@ -0,0 +1,853 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ Tree-sitter Analyzer API
4
+
5
+ Public API facade that provides a stable, high-level interface to the
6
+ tree-sitter analyzer framework. This is the main entry point for both
7
+ CLI and MCP interfaces.
8
+ """
9
+
10
+ import logging
11
+ from pathlib import Path
12
+ from typing import Any
13
+
14
+ from . import __version__
15
+ from .core.engine import AnalysisEngine
16
+ from .utils import log_error
17
+
18
+ logger = logging.getLogger(__name__)
19
+
20
+ # Global engine instance (singleton pattern)
21
+ _engine: AnalysisEngine | None = None
22
+
23
+
24
+ def get_engine() -> AnalysisEngine:
25
+ """
26
+ Get the global analysis engine instance.
27
+
28
+ Returns:
29
+ AnalysisEngine instance
30
+ """
31
+ global _engine
32
+ if _engine is None:
33
+ _engine = AnalysisEngine()
34
+ return _engine
35
+
36
+
37
def analyze_file(
    file_path: str | Path,
    language: str | None = None,
    queries: list[str] | None = None,
    include_elements: bool = True,
    include_details: bool = False,  # Accepted for backward compatibility; not used
    include_queries: bool = True,
    include_complexity: bool = False,  # Accepted for backward compatibility; not used
) -> dict[str, Any]:
    """
    Analyze a source code file.

    This is the main high-level function for file analysis. It handles
    language detection, parsing, query execution, and element extraction.

    Args:
        file_path: Path to the source file to analyze
        language: Programming language (auto-detected if not specified)
        queries: List of query names to execute (all available if not specified)
        include_elements: Whether to extract code elements
        include_details: Unused; kept for backward compatibility
        include_queries: Whether to execute queries
        include_complexity: Unused; kept for backward compatibility

    Returns:
        Analysis results dictionary

    Raises:
        FileNotFoundError: Re-raised unchanged for callers that expect it;
            every other error is reported inside the result dictionary.
    """

    # Optional, type-specific element attributes copied verbatim when present.
    _OPTIONAL_ATTRS = (
        "module_path",
        "module_name",
        "imported_names",
        "variable_type",
        "initializer",
        "is_constant",
        "parameters",
        "return_type",
        "is_async",
        "is_static",
        "is_constructor",
        "is_method",
        "complexity_score",
        "superclass",
        "class_type",
    )

    def _element_to_dict(elem: Any, all_elements: list[Any]) -> dict[str, Any]:
        """Convert one extracted element into its API dict representation."""
        elem_dict: dict[str, Any] = {
            "name": elem.name,
            "type": type(elem).__name__.lower(),
            "start_line": elem.start_line,
            "end_line": elem.end_line,
            "raw_text": elem.raw_text,
            "language": elem.language,
        }

        for attr in _OPTIONAL_ATTRS:
            if hasattr(elem, attr):
                elem_dict[attr] = getattr(elem, attr)

        # For methods, resolve the enclosing class by line containment.
        if elem_dict.get("is_method") and elem_dict["type"] == "function":
            for other in all_elements:
                if (
                    hasattr(other, "start_line")
                    and hasattr(other, "end_line")
                    and type(other).__name__.lower() == "class"
                    and other.start_line <= elem.start_line <= other.end_line
                ):
                    elem_dict["class_name"] = other.name
                    break
            else:
                # No enclosing class found in the element list.
                elem_dict["class_name"] = None

        return elem_dict

    try:
        engine = get_engine()

        # Perform the analysis
        analysis_result = engine.analyze_file(file_path, language, queries=queries)

        # Convert AnalysisResult to the expected API format (same as analyze_code)
        result: dict[str, Any] = {
            "success": analysis_result.success,
            "file_info": {
                "path": str(file_path),
                "exists": True,
            },
            "language_info": {
                "language": analysis_result.language,
                # True only when the caller did not supply the language.
                "detected": language is None,
            },
            "ast_info": {
                "node_count": analysis_result.node_count,
                "line_count": analysis_result.line_count,
            },
        }

        # Build the optional sections only when requested; this removes the
        # previous "always add, then conditionally delete" filtering.
        if include_elements and hasattr(analysis_result, "elements"):
            result["elements"] = [
                _element_to_dict(elem, analysis_result.elements)
                for elem in analysis_result.elements
            ]

        if include_queries and hasattr(analysis_result, "query_results"):
            result["query_results"] = analysis_result.query_results

        # Surface the engine's error message when analysis failed.
        if not analysis_result.success and analysis_result.error_message:
            result["error"] = analysis_result.error_message

        return result

    except FileNotFoundError:
        # Bare re-raise preserves the original traceback for callers/tests
        # that expect this exception.
        raise
    except Exception as e:
        log_error(f"API analyze_file failed: {e}")
        return {
            "success": False,
            "error": str(e),
            "file_info": {"path": str(file_path), "exists": False},
            "language_info": {"language": language or "unknown", "detected": False},
            "ast_info": {"node_count": 0, "line_count": 0},
        }
180
+
181
+
182
def analyze_code(
    source_code: str,
    language: str,
    queries: list[str] | None = None,
    include_elements: bool = True,
    include_queries: bool = True,
) -> dict[str, Any]:
    """
    Analyze source code directly (without a file).

    Args:
        source_code: Source code string to analyze
        language: Programming language
        queries: List of query names to execute (all available if not specified).
            NOTE(review): this argument is currently not forwarded to the
            engine — ``engine.analyze_code`` is called without it; confirm
            whether the engine supports per-call queries here.
        include_elements: Whether to extract code elements
        include_queries: Whether to execute queries

    Returns:
        Analysis results dictionary
    """

    # Optional, type-specific element attributes copied verbatim when present.
    _OPTIONAL_ATTRS = (
        "module_path",
        "module_name",
        "imported_names",
        "variable_type",
        "initializer",
        "is_constant",
        "parameters",
        "return_type",
        "is_async",
        "is_static",
        "is_constructor",
        "is_method",
        "complexity_score",
        "superclass",
        "class_type",
    )

    def _element_to_dict(elem: Any, all_elements: list[Any]) -> dict[str, Any]:
        """Convert one extracted element into its API dict representation."""
        elem_dict: dict[str, Any] = {
            "name": elem.name,
            "type": type(elem).__name__.lower(),
            "start_line": elem.start_line,
            "end_line": elem.end_line,
            "raw_text": elem.raw_text,
            "language": elem.language,
        }

        for attr in _OPTIONAL_ATTRS:
            if hasattr(elem, attr):
                elem_dict[attr] = getattr(elem, attr)

        # For methods, resolve the enclosing class by line containment.
        if elem_dict.get("is_method") and elem_dict["type"] == "function":
            for other in all_elements:
                if (
                    hasattr(other, "start_line")
                    and hasattr(other, "end_line")
                    and type(other).__name__.lower() == "class"
                    and other.start_line <= elem.start_line <= other.end_line
                ):
                    elem_dict["class_name"] = other.name
                    break
            else:
                # No enclosing class found in the element list.
                elem_dict["class_name"] = None

        return elem_dict

    try:
        engine = get_engine()

        # Perform the analysis
        analysis_result = engine.analyze_code(source_code, language)

        # Convert AnalysisResult to the expected API format
        result: dict[str, Any] = {
            "success": analysis_result.success,
            "language_info": {
                "language": analysis_result.language,
                "detected": False,  # Language was explicitly provided
            },
            "ast_info": {
                "node_count": analysis_result.node_count,
                "line_count": analysis_result.line_count,
            },
        }

        # Build the optional sections only when requested; this removes the
        # previous "always add, then conditionally delete" filtering.
        if include_elements and hasattr(analysis_result, "elements"):
            result["elements"] = [
                _element_to_dict(elem, analysis_result.elements)
                for elem in analysis_result.elements
            ]

        if include_queries and hasattr(analysis_result, "query_results"):
            result["query_results"] = analysis_result.query_results

        # Surface the engine's error message when analysis failed.
        if not analysis_result.success and analysis_result.error_message:
            result["error"] = analysis_result.error_message

        return result

    except Exception as e:
        log_error(f"API analyze_code failed: {e}")
        return {"success": False, "error": str(e)}
306
+
307
+
308
def get_supported_languages() -> list[str]:
    """
    Return the names of every supported programming language.

    Returns:
        List of supported language names (empty on failure)
    """
    try:
        return get_engine().get_supported_languages()
    except Exception as e:
        log_error(f"Failed to get supported languages: {e}")
        return []
321
+
322
+
323
def get_available_queries(language: str) -> list[str]:
    """
    Return the query names available for a specific language.

    Args:
        language: Programming language name

    Returns:
        List of available query names (empty on failure)
    """
    try:
        # Ask the language plugin for its supported queries, if it exposes them.
        plugin = get_engine()._get_language_plugin(language)
        if plugin and hasattr(plugin, "get_supported_queries"):
            supported = plugin.get_supported_queries()
            return list(supported) if supported else []
        # No plugin-specific queries available; fall back to the default set.
        return ["class", "method", "field"]
    except Exception as e:
        log_error(f"Failed to get available queries for {language}: {e}")
        return []
346
+
347
+
348
def is_language_supported(language: str) -> bool:
    """
    Check whether a programming language is supported (case-insensitive).

    Args:
        language: Programming language name

    Returns:
        True if the language is supported
    """
    try:
        wanted = language.lower()
        return any(name.lower() == wanted for name in get_supported_languages())
    except Exception as e:
        log_error(f"Failed to check language support for {language}: {e}")
        return False
364
+
365
+
366
+ def detect_language(file_path: str | Path) -> str:
367
+ """
368
+ Detect programming language from file path.
369
+
370
+ Args:
371
+ file_path: Path to the file
372
+
373
+ Returns:
374
+ Detected language name - 常に有効な文字列を返す
375
+ """
376
+ try:
377
+ # Handle invalid input
378
+ if not file_path:
379
+ return "unknown"
380
+
381
+ engine = get_engine()
382
+ # Use language_detector instead of language_registry
383
+ result = engine.language_detector.detect_from_extension(str(file_path))
384
+
385
+ # Ensure result is valid
386
+ if not result or result.strip() == "":
387
+ return "unknown"
388
+
389
+ return result
390
+ except Exception as e:
391
+ log_error(f"Failed to detect language for {file_path}: {e}")
392
+ return "unknown"
393
+
394
+
395
def get_file_extensions(language: str) -> list[str]:
    """
    Return the file extensions associated with a specific language.

    Args:
        language: Programming language name

    Returns:
        List of file extensions (empty on failure)
    """
    try:
        detector = get_engine().language_detector
        if hasattr(detector, "get_extensions_for_language"):
            extensions = detector.get_extensions_for_language(language)
            return list(extensions) if extensions else []
        # The detector lacks the lookup API; use a small built-in table.
        fallback: dict[str, list[str]] = {
            "java": [".java"],
            "python": [".py"],
            "javascript": [".js"],
            "typescript": [".ts"],
            "c": [".c"],
            "cpp": [".cpp", ".cxx", ".cc"],
            "go": [".go"],
            "rust": [".rs"],
        }
        return fallback.get(language.lower(), [])
    except Exception as e:
        log_error(f"Failed to get extensions for {language}: {e}")
        return []
427
+
428
+
429
+ def validate_file(file_path: str | Path) -> dict[str, Any]:
430
+ """
431
+ Validate a source code file without full analysis.
432
+
433
+ Args:
434
+ file_path: Path to the file to validate
435
+
436
+ Returns:
437
+ Validation results dictionary
438
+ """
439
+ file_path = Path(file_path)
440
+
441
+ result: dict[str, Any] = {
442
+ "valid": False,
443
+ "exists": file_path.exists(),
444
+ "readable": False,
445
+ "language": None,
446
+ "supported": False,
447
+ "size": 0,
448
+ "errors": [],
449
+ }
450
+
451
+ try:
452
+ # Check if file exists
453
+ if not file_path.exists():
454
+ result["errors"].append("File does not exist")
455
+ return result
456
+
457
+ # Check if file is readable
458
+ try:
459
+ from .encoding_utils import read_file_safe
460
+
461
+ # Test file readability by reading it
462
+ read_file_safe(file_path)
463
+ result["readable"] = True
464
+ result["size"] = file_path.stat().st_size
465
+ except Exception as e:
466
+ result["errors"].append(f"File is not readable: {e}")
467
+ return result
468
+
469
+ # Detect language
470
+ language = detect_language(file_path)
471
+ result["language"] = language
472
+
473
+ if language:
474
+ result["supported"] = is_language_supported(language)
475
+ if not result["supported"]:
476
+ result["errors"].append(f"Language '{language}' is not supported")
477
+ else:
478
+ result["errors"].append("Could not detect programming language")
479
+
480
+ # If we got this far with no errors, the file is valid
481
+ result["valid"] = len(result["errors"]) == 0
482
+
483
+ except Exception as e:
484
+ result["errors"].append(f"Validation failed: {e}")
485
+
486
+ return result
487
+
488
+
489
def get_framework_info() -> dict[str, Any]:
    """
    Return information about the framework and its capabilities.

    Returns:
        Framework information dictionary (includes an "error" key on failure)
    """
    try:
        engine = get_engine()
        languages = engine.get_supported_languages()
        manager = engine.plugin_manager

        return {
            "name": "tree-sitter-analyzer",
            "version": __version__,
            "supported_languages": languages,
            "total_languages": len(languages),
            "plugin_info": {
                "manager_available": manager is not None,
                "loaded_plugins": (
                    len(manager.get_supported_languages()) if manager else 0
                ),
            },
            "core_components": [
                "AnalysisEngine",
                "Parser",
                "QueryExecutor",
                "PluginManager",
                "LanguageDetector",
            ],
        }
    except Exception as e:
        log_error(f"Failed to get framework info: {e}")
        return {"name": "tree-sitter-analyzer", "version": __version__, "error": str(e)}
523
+
524
+
525
def _group_captures_by_main_node(
    captures: list[dict[str, Any]],
) -> list[dict[str, Any]]:
    """
    Group query captures by their main nodes (e.g., @method, @class, @function).

    NOTE(review): This definition is dead code — it is shadowed by a second
    ``_group_captures_by_main_node`` defined later in this module, which
    additionally copies top-level fields (text, start_line, end_line, ...)
    from the main node into each result. Consider deleting this copy.

    Each group represents one match of the query pattern, with all its sub-captures.
    For example, a method_with_annotations query returns:
    - One @method capture (the main node)
    - One or more @annotation captures
    - One @name capture
    These all get grouped together as one "result".

    Args:
        captures: Flat list of all captures from the query

    Returns:
        List of grouped results, where each result has a 'captures' dict mapping
        capture names to their data.
    """
    if not captures:
        return []

    # Identify the main capture type (method, class, function, etc.)
    # Usually it's the one with the longest text span or appears first
    main_capture_types = {"method", "class", "function", "interface", "field"}

    # Group by start position - captures that share the same main node position
    position_groups: dict[tuple[int, int], list[dict[str, Any]]] = {}

    for capture in captures:
        capture_name = capture.get("capture_name", "")

        # Find the main node position for this capture
        if capture_name in main_capture_types:
            # This is a main node, use its position as the key
            pos_key = (capture.get("start_byte", 0), capture.get("end_byte", 0))
        else:
            # This is a sub-capture, we'll need to find its parent later
            # For now, use its own position
            pos_key = (capture.get("start_byte", 0), capture.get("end_byte", 0))

        if pos_key not in position_groups:
            position_groups[pos_key] = []
        position_groups[pos_key].append(capture)

    # Now group captures that belong together
    # A capture belongs to a main node if it's within the main node's byte range
    results = []
    main_nodes = []

    # First, identify all main nodes
    for captures_list in position_groups.values():
        for capture in captures_list:
            if capture.get("capture_name") in main_capture_types:
                main_nodes.append(capture)

    # For each main node, find all sub-captures within its range
    for main_node in main_nodes:
        main_start = main_node.get("start_byte", 0)
        main_end = main_node.get("end_byte", 0)
        main_name = main_node.get("capture_name", "")

        # Collect all captures within this main node's range
        grouped_captures = {main_name: main_node}

        for captures_list in position_groups.values():
            for capture in captures_list:
                capture_start = capture.get("start_byte", 0)
                capture_end = capture.get("end_byte", 0)
                capture_name = capture.get("capture_name", "")

                # Skip the main node itself
                if capture is main_node:
                    continue

                # Check if this capture is within the main node's range
                if capture_start >= main_start and capture_end <= main_end:
                    # Group multiple captures of the same name in a list
                    if capture_name in grouped_captures:
                        # Convert to list if not already
                        if not isinstance(grouped_captures[capture_name], list):
                            grouped_captures[capture_name] = [
                                grouped_captures[capture_name]
                            ]
                        grouped_captures[capture_name].append(capture)
                    else:
                        grouped_captures[capture_name] = capture

        results.append({"captures": grouped_captures})

    return results
617
+
618
+
619
+ def _group_captures_by_main_node(
620
+ captures: list[dict[str, Any]],
621
+ ) -> list[dict[str, Any]]:
622
+ """
623
+ Group query captures by their main nodes (e.g., @method, @class, @function).
624
+
625
+ Each group represents one match of the query pattern, with all its sub-captures.
626
+ For example, a method_with_annotations query returns:
627
+ - One @method capture (the main node)
628
+ - One or more @annotation captures
629
+ - One @name capture
630
+ These all get grouped together as one "result".
631
+
632
+ Args:
633
+ captures: Flat list of all captures from the query
634
+
635
+ Returns:
636
+ List of grouped results, where each result has:
637
+ - 'captures' dict mapping capture names to their data
638
+ - Top-level fields from the main node (text, start_line, end_line, etc.)
639
+ """
640
+ if not captures:
641
+ return []
642
+
643
+ # Identify the main capture type (method, class, function, etc.)
644
+ # Usually it's the one with the longest text span or appears first
645
+ main_capture_types = {"method", "class", "function", "interface", "field"}
646
+
647
+ # Group by start position - captures that share the same main node position
648
+ position_groups: dict[tuple[int, int], list[dict[str, Any]]] = {}
649
+
650
+ for capture in captures:
651
+ capture_name = capture.get("capture_name", "")
652
+
653
+ # Find the main node position for this capture
654
+ if capture_name in main_capture_types:
655
+ # This is a main node, use its position as the key
656
+ pos_key = (capture.get("start_byte", 0), capture.get("end_byte", 0))
657
+ else:
658
+ # This is a sub-capture, we'll need to find its parent later
659
+ # For now, use its own position
660
+ pos_key = (capture.get("start_byte", 0), capture.get("end_byte", 0))
661
+
662
+ if pos_key not in position_groups:
663
+ position_groups[pos_key] = []
664
+ position_groups[pos_key].append(capture)
665
+
666
+ # Now group captures that belong together
667
+ # A capture belongs to a main node if it's within the main node's byte range
668
+ results = []
669
+ main_nodes = []
670
+
671
+ # First, identify all main nodes
672
+ for captures_list in position_groups.values():
673
+ for capture in captures_list:
674
+ if capture.get("capture_name") in main_capture_types:
675
+ main_nodes.append(capture)
676
+
677
+ # For each main node, find all sub-captures within its range
678
+ for main_node in main_nodes:
679
+ main_start = main_node.get("start_byte", 0)
680
+ main_end = main_node.get("end_byte", 0)
681
+ main_name = main_node.get("capture_name", "")
682
+
683
+ # Collect all captures within this main node's range
684
+ grouped_captures = {main_name: main_node}
685
+
686
+ for captures_list in position_groups.values():
687
+ for capture in captures_list:
688
+ capture_start = capture.get("start_byte", 0)
689
+ capture_end = capture.get("end_byte", 0)
690
+ capture_name = capture.get("capture_name", "")
691
+
692
+ # Skip the main node itself
693
+ if capture is main_node:
694
+ continue
695
+
696
+ # Check if this capture is within the main node's range
697
+ if capture_start >= main_start and capture_end <= main_end:
698
+ # Group multiple captures of the same name in a list
699
+ if capture_name in grouped_captures:
700
+ # Convert to list if not already
701
+ if not isinstance(grouped_captures[capture_name], list):
702
+ grouped_captures[capture_name] = [
703
+ grouped_captures[capture_name]
704
+ ]
705
+ grouped_captures[capture_name].append(capture)
706
+ else:
707
+ grouped_captures[capture_name] = capture
708
+
709
+ # Create result with top-level fields from main node
710
+ result = {
711
+ "captures": grouped_captures,
712
+ "text": main_node.get("text", ""),
713
+ "start_line": main_node.get("line_number", 0),
714
+ "end_line": main_node.get("line_number", 0)
715
+ + main_node.get("text", "").count("\n"),
716
+ "start_byte": main_start,
717
+ "end_byte": main_end,
718
+ "node_type": main_node.get("node_type", ""),
719
+ }
720
+ results.append(result)
721
+
722
+ return results
723
+
724
+
725
def execute_query(
    file_path: str | Path, query_name: str, language: str | None = None
) -> dict[str, Any]:
    """
    Run a single named query against a source file.

    Args:
        file_path: Path to the source file
        query_name: Name of the query to execute
        language: Programming language (auto-detected if not specified)

    Returns:
        Query execution results
    """
    try:
        # Restrict the analysis to just the requested query.
        analysis = analyze_file(
            file_path,
            language=language,
            queries=[query_name],
            include_elements=False,
            include_queries=True,
        )

        # Guard clause: bail out early when the analysis did not produce
        # query results at all.
        if not (analysis["success"] and "query_results" in analysis):
            return {
                "success": False,
                "query_name": query_name,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        raw = analysis["query_results"].get(query_name, {})

        # Normalize the raw query result into a flat list of captures,
        # tolerating both the dict-with-"captures" and bare-list shapes.
        if isinstance(raw, dict) and "captures" in raw:
            capture_list = raw["captures"]
        elif isinstance(raw, list):
            capture_list = raw
        else:
            capture_list = []

        # Bundle related captures together (e.g. a method with its
        # annotations and name) under their main node.
        grouped = _group_captures_by_main_node(capture_list)

        return {
            "success": True,
            "query_name": query_name,
            "results": grouped,
            "count": len(grouped),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as e:
        log_error(f"Query execution failed: {e}")
        return {
            "success": False,
            "query_name": query_name,
            "error": str(e),
            "file_path": str(file_path),
        }
788
+
789
+
790
def extract_elements(
    file_path: str | Path,
    language: str | None = None,
    element_types: list[str] | None = None,
) -> dict[str, Any]:
    """
    Extract code elements from a file.

    Args:
        file_path: Path to the source file
        language: Programming language (auto-detected if not specified)
        element_types: Types of elements to extract (all if not specified)

    Returns:
        Element extraction results
    """
    try:
        # Run the analysis with element extraction only; queries are skipped.
        analysis = analyze_file(
            file_path, language=language, include_elements=True, include_queries=False
        )

        # Guard clause: no elements means nothing further to do.
        if not (analysis["success"] and "elements" in analysis):
            return {
                "success": False,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        elements = analysis["elements"]

        # When specific kinds were requested, keep only elements whose type
        # contains one of the requested names (case-insensitive substring).
        if element_types:
            wanted = [etype.lower() for etype in element_types]
            elements = [
                element
                for element in elements
                if any(w in element.get("type", "").lower() for w in wanted)
            ]

        return {
            "success": True,
            "elements": elements,
            "count": len(elements),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as e:
        log_error(f"Element extraction failed: {e}")
        return {"success": False, "error": str(e), "file_path": str(file_path)}
843
+
844
+
845
+ # Convenience functions for backward compatibility
846
+ def analyze(file_path: str | Path, **kwargs: Any) -> dict[str, Any]:
847
+ """Convenience function that aliases to analyze_file."""
848
+ return analyze_file(file_path, **kwargs)
849
+
850
+
851
def get_languages() -> list[str]:
    """Backward-compatible alias: delegate directly to ``get_supported_languages``."""
    languages = get_supported_languages()
    return languages