PyPI - tree-sitter-analyzer - Versions diffs - 1.9.2__py3-none-any.whl → 1.9.4__py3-none-any.whl - Mend

tree-sitter-analyzer 1.9.2__py3-none-any.whl → 1.9.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of tree-sitter-analyzer might be problematic. Click here for more details.

Files changed (64)

tree_sitter_analyzer/__init__.py +1 -1
tree_sitter_analyzer/api.py +216 -8
tree_sitter_analyzer/cli/argument_validator.py +1 -1
tree_sitter_analyzer/cli/commands/advanced_command.py +3 -6
tree_sitter_analyzer/cli/commands/query_command.py +3 -1
tree_sitter_analyzer/cli/commands/table_command.py +3 -3
tree_sitter_analyzer/constants.py +5 -3
tree_sitter_analyzer/core/analysis_engine.py +1 -1
tree_sitter_analyzer/core/cache_service.py +1 -1
tree_sitter_analyzer/core/engine.py +34 -10
tree_sitter_analyzer/core/query.py +82 -2
tree_sitter_analyzer/encoding_utils.py +64 -0
tree_sitter_analyzer/exceptions.py +1 -1
tree_sitter_analyzer/file_handler.py +49 -33
tree_sitter_analyzer/formatters/base_formatter.py +1 -1
tree_sitter_analyzer/formatters/html_formatter.py +24 -14
tree_sitter_analyzer/formatters/javascript_formatter.py +28 -21
tree_sitter_analyzer/formatters/language_formatter_factory.py +7 -4
tree_sitter_analyzer/formatters/markdown_formatter.py +4 -4
tree_sitter_analyzer/formatters/python_formatter.py +4 -4
tree_sitter_analyzer/formatters/typescript_formatter.py +1 -1
tree_sitter_analyzer/interfaces/mcp_adapter.py +4 -2
tree_sitter_analyzer/interfaces/mcp_server.py +10 -10
tree_sitter_analyzer/language_detector.py +30 -5
tree_sitter_analyzer/language_loader.py +46 -26
tree_sitter_analyzer/languages/css_plugin.py +6 -6
tree_sitter_analyzer/languages/html_plugin.py +12 -8
tree_sitter_analyzer/languages/java_plugin.py +330 -520
tree_sitter_analyzer/languages/javascript_plugin.py +22 -78
tree_sitter_analyzer/languages/markdown_plugin.py +277 -297
tree_sitter_analyzer/languages/python_plugin.py +47 -85
tree_sitter_analyzer/languages/typescript_plugin.py +48 -123
tree_sitter_analyzer/mcp/resources/project_stats_resource.py +14 -8
tree_sitter_analyzer/mcp/server.py +38 -23
tree_sitter_analyzer/mcp/tools/analyze_scale_tool.py +10 -7
tree_sitter_analyzer/mcp/tools/analyze_scale_tool_cli_compatible.py +51 -7
tree_sitter_analyzer/mcp/tools/fd_rg_utils.py +11 -7
tree_sitter_analyzer/mcp/tools/find_and_grep_tool.py +8 -6
tree_sitter_analyzer/mcp/tools/list_files_tool.py +6 -6
tree_sitter_analyzer/mcp/tools/output_format_validator.py +148 -0
tree_sitter_analyzer/mcp/tools/search_content_tool.py +48 -15
tree_sitter_analyzer/mcp/tools/table_format_tool.py +13 -8
tree_sitter_analyzer/mcp/utils/file_output_manager.py +8 -3
tree_sitter_analyzer/mcp/utils/gitignore_detector.py +24 -12
tree_sitter_analyzer/mcp/utils/path_resolver.py +2 -2
tree_sitter_analyzer/models.py +16 -0
tree_sitter_analyzer/mypy_current_errors.txt +2 -0
tree_sitter_analyzer/plugins/base.py +66 -0
tree_sitter_analyzer/queries/java.py +9 -3
tree_sitter_analyzer/queries/javascript.py +3 -8
tree_sitter_analyzer/queries/markdown.py +1 -1
tree_sitter_analyzer/queries/python.py +2 -2
tree_sitter_analyzer/security/boundary_manager.py +2 -5
tree_sitter_analyzer/security/regex_checker.py +2 -2
tree_sitter_analyzer/security/validator.py +5 -1
tree_sitter_analyzer/table_formatter.py +4 -4
tree_sitter_analyzer/utils/__init__.py +27 -116
tree_sitter_analyzer/{utils.py → utils/logging.py} +2 -2
tree_sitter_analyzer/utils/tree_sitter_compat.py +2 -2
{tree_sitter_analyzer-1.9.2.dist-info → tree_sitter_analyzer-1.9.4.dist-info}/METADATA +87 -45
tree_sitter_analyzer-1.9.4.dist-info/RECORD +111 -0
tree_sitter_analyzer-1.9.2.dist-info/RECORD +0 -109
{tree_sitter_analyzer-1.9.2.dist-info → tree_sitter_analyzer-1.9.4.dist-info}/WHEEL +0 -0
{tree_sitter_analyzer-1.9.2.dist-info → tree_sitter_analyzer-1.9.4.dist-info}/entry_points.txt +0 -0

tree_sitter_analyzer/languages/java_plugin.py CHANGED Viewed

@@ -7,7 +7,7 @@ Migrated from AdvancedAnalyzer implementation for future independence.
 """
 import re
-from typing import TYPE_CHECKING, Any, Optional
+from typing import TYPE_CHECKING, Any
 if TYPE_CHECKING:
     import tree_sitter
@@ -16,7 +16,7 @@ if TYPE_CHECKING:
     from ..models import AnalysisResult
 from ..encoding_utils import extract_text_slice, safe_encode
-from ..models import Class, CodeElement, Function, Import, Package, Variable
+from ..models import Class, Function, Import, Package, Variable
 from ..plugins.base import ElementExtractor, LanguagePlugin
 from ..utils import log_debug, log_error, log_warning
@@ -258,16 +258,13 @@ class JavaElementExtractor(ElementExtractor):
         packages: list[Package] = []
         # Extract package declaration
-        if tree is None or tree.root_node is None:
-            log_debug("Tree or root_node is None, returning empty packages list")
-            return packages
-        for child in tree.root_node.children:
-            if child.type == "package_declaration":
-                package_info = self._extract_package_element(child)
-                if package_info:
-                    packages.append(package_info)
-                break  # Only one package declaration per file
+        if tree and tree.root_node:
+            for child in tree.root_node.children:
+                if child.type == "package_declaration":
+                    package_info = self._extract_package_element(child)
+                    if package_info:
+                        packages.append(package_info)
+                    break  # Only one package declaration per file
         log_debug(f"Extracted {len(packages)} packages")
         return packages
@@ -456,7 +453,8 @@ class JavaElementExtractor(ElementExtractor):
                 if start_point[0] == end_point[0]:
                     # Single line
                     line = self.content_lines[start_point[0]]
-                    return line[start_point[1] : end_point[1]]
+                    result: str = line[start_point[1] : end_point[1]]
+                    return result
                 else:
                     # Multiple lines
                     lines = []
@@ -835,623 +833,435 @@ class JavaElementExtractor(ElementExtractor):
             log_debug(f"Failed to extract package element: {e}")
         except Exception as e:
             log_error(f"Unexpected error in package element extraction: {e}")
         return None
     def _extract_package_from_tree(self, tree: "tree_sitter.Tree") -> None:
-        """
-        Extract package information from the tree and set current_package.
-        This method ensures that package information is available for class extraction
-        regardless of the order in which extraction methods are called.
-        """
-        try:
-            # Look for package declaration in the root node's children
+        """Extract package information from tree when needed"""
+        if tree and tree.root_node:
             for child in tree.root_node.children:
                 if child.type == "package_declaration":
                     self._extract_package_info(child)
-                    break  # Only one package declaration per file
-        except Exception as e:
-            log_debug(f"Failed to extract package from tree: {e}")
-    def _determine_visibility(self, modifiers: list[str]) -> str:
-        """Determine visibility from modifiers"""
-        if "public" in modifiers:
-            return "public"
-        elif "private" in modifiers:
-            return "private"
-        elif "protected" in modifiers:
-            return "protected"
-        else:
-            return "package"  # Default package visibility
-    def _find_annotations_for_line_cached(
-        self, target_line: int
-    ) -> list[dict[str, Any]]:
-        """Find annotations for specified line with caching (from AdvancedAnalyzer)"""
-        if target_line in self._annotation_cache:
-            return self._annotation_cache[target_line]
-        result_annotations = []
-        for annotation in self.annotations:
-            line_distance = target_line - annotation.get("end_line", 0)
-            if 1 <= line_distance <= 5:
-                result_annotations.append(annotation)
-        self._annotation_cache[target_line] = result_annotations
-        return result_annotations
-    def _calculate_complexity_optimized(self, node: "tree_sitter.Node") -> int:
-        """Calculate cyclomatic complexity efficiently (from AdvancedAnalyzer)"""
-        complexity = 1
-        try:
-            node_text = self._get_node_text_optimized(node).lower()
-            keywords = ["if", "while", "for", "catch", "case", "switch"]
-            for keyword in keywords:
-                complexity += node_text.count(keyword)
-        except (AttributeError, TypeError) as e:
-            log_debug(f"Failed to calculate complexity: {e}")
-        except Exception as e:
-            log_error(f"Unexpected error in complexity calculation: {e}")
-        return complexity
-    def _extract_javadoc_for_line(self, target_line: int) -> str | None:
-        """Extract JavaDoc comment immediately before the specified line"""
-        try:
-            if not self.content_lines or target_line <= 1:
-                return None
-            # Search backwards from target_line
-            javadoc_lines = []
-            current_line = target_line - 1
-            # Skip empty lines
-            while current_line > 0:
-                line = self.content_lines[current_line - 1].strip()
-                if line:
                     break
-                current_line -= 1
-            # Check for JavaDoc end
-            if current_line > 0:
-                line = self.content_lines[current_line - 1].strip()
-                if line.endswith("*/"):
-                    # This might be a JavaDoc comment
-                    javadoc_lines.append(self.content_lines[current_line - 1])
-                    current_line -= 1
-                    # Collect JavaDoc content
-                    while current_line > 0:
-                        line_content = self.content_lines[current_line - 1]
-                        line_stripped = line_content.strip()
-                        javadoc_lines.append(line_content)
-                        if line_stripped.startswith("/**"):
-                            # Found the start of JavaDoc
-                            javadoc_lines.reverse()
-                            javadoc_text = "\n".join(javadoc_lines)
-                            # Clean up the JavaDoc
-                            return self._clean_javadoc(javadoc_text)
-                        current_line -= 1
-            return None
-        except Exception as e:
-            log_debug(f"Failed to extract JavaDoc: {e}")
-            return None
-    def _clean_javadoc(self, javadoc_text: str) -> str:
-        """Clean JavaDoc text by removing comment markers"""
-        if not javadoc_text:
-            return ""
-        lines = javadoc_text.split("\n")
-        cleaned_lines = []
-        for line in lines:
-            # Remove leading/trailing whitespace
-            line = line.strip()
-            # Remove comment markers
-            if line.startswith("/**"):
-                line = line[3:].strip()
-            elif line.startswith("*/"):
-                line = line[2:].strip()
-            elif line.startswith("*"):
-                line = line[1:].strip()
-            if line:  # Only add non-empty lines
-                cleaned_lines.append(line)
-        return " ".join(cleaned_lines) if cleaned_lines else ""
-    def _is_nested_class(self, node: "tree_sitter.Node") -> bool:
-        """Check if this is a nested class (from AdvancedAnalyzer)"""
-        current = node.parent
-        while current:
-            if current.type in [
-                "class_declaration",
-                "interface_declaration",
-                "enum_declaration",
-            ]:
-                return True
-            current = current.parent
-        return False
-    def _find_parent_class(self, node: "tree_sitter.Node") -> str | None:
-        """Find parent class name (from AdvancedAnalyzer)"""
-        current = node.parent
-        while current:
-            if current.type in [
-                "class_declaration",
-                "interface_declaration",
-                "enum_declaration",
-            ]:
-                return self._extract_class_name(current)
-            current = current.parent
-        return None
-    def _extract_class_name(self, node: "tree_sitter.Node") -> str | None:
-        """Extract class name from node (from AdvancedAnalyzer)"""
-        for child in node.children:
-            if child.type == "identifier":
-                return self._get_node_text_optimized(child)
-        return None
-    def _extract_annotation_optimized(
-        self, node: "tree_sitter.Node"
-    ) -> dict[str, Any] | None:
-        """Extract annotation information optimized (from AdvancedAnalyzer)"""
-        try:
-            start_line = node.start_point[0] + 1
-            end_line = node.end_point[0] + 1
-            raw_text = self._get_node_text_optimized(node)
-            # Extract annotation name efficiently
-            name_match = re.search(r"@(\w+)", raw_text)
-            if not name_match:
-                return None
-            annotation_name = name_match.group(1)
-            # Extract parameters efficiently
-            parameters = []
-            param_match = re.search(r"\((.*?)\)", raw_text, re.DOTALL)
-            if param_match:
-                param_text = param_match.group(1).strip()
-                if param_text:
-                    # Simple parameter parsing
-                    if "=" in param_text:
-                        parameters = [
-                            p.strip() for p in re.split(r",(?![^()]*\))", param_text)
-                        ]
-                    else:
-                        parameters = [param_text]
-            return {
-                "name": annotation_name,
-                "parameters": parameters,
-                "start_line": start_line,
-                "end_line": end_line,
-                "raw_text": raw_text,
-            }
-        except (AttributeError, IndexError, ValueError) as e:
-            log_debug(f"Failed to extract annotation from node: {e}")
-            return None
-        except Exception as e:
-            log_error(f"Unexpected exception in annotation extraction: {e}")
-            return None
     def _extract_import_info(
         self, node: "tree_sitter.Node", source_code: str
     ) -> Import | None:
-        """Extract import information (from AdvancedAnalyzer)"""
+        """Extract import information from import declaration node"""
         try:
             import_text = self._get_node_text_optimized(node)
-            # Simple approach: get everything until semicolon then process
-            import_content = import_text.strip()
-            if import_content.endswith(";"):
-                import_content = import_content[:-1]
+            line_num = node.start_point[0] + 1
-            if "static" in import_content:
+            # Parse import statement
+            if "static" in import_text:
                 # Static import
-                static_match = re.search(r"import\s+static\s+([\w.]+)", import_content)
+                static_match = re.search(r"import\s+static\s+([\w.]+)", import_text)
                 if static_match:
                     import_name = static_match.group(1)
-                    # Handle wildcard case
-                    if import_content.endswith(".*"):
+                    if import_text.endswith(".*"):
                         import_name = import_name.replace(".*", "")
-                    # For static imports, extract the class name (remove method/field name)
+                    # For static imports, extract the class name
                     parts = import_name.split(".")
                     if len(parts) > 1:
-                        # Remove the last part (method/field name) to get class name
                         import_name = ".".join(parts[:-1])
                     return Import(
                         name=import_name,
-                        start_line=node.start_point[0] + 1,
-                        end_line=node.end_point[0] + 1,
+                        start_line=line_num,
+                        end_line=line_num,
                         raw_text=import_text,
                         language="java",
                         module_name=import_name,
                         is_static=True,
-                        is_wildcard=import_content.endswith(".*"),
-                        import_statement=import_content,
+                        is_wildcard=import_text.endswith(".*"),
+                        import_statement=import_text,
                     )
             else:
                 # Normal import
-                normal_match = re.search(r"import\s+([\w.]+)", import_content)
+                normal_match = re.search(r"import\s+([\w.]+)", import_text)
                 if normal_match:
                     import_name = normal_match.group(1)
-                    # Handle wildcard case
-                    if import_content.endswith(".*"):
+                    if import_text.endswith(".*"):
                         if import_name.endswith(".*"):
-                            import_name = import_name[:-2]  # Remove trailing .*
+                            import_name = import_name[:-2]
                         elif import_name.endswith("."):
-                            import_name = import_name[:-1]  # Remove trailing .
+                            import_name = import_name[:-1]
                     return Import(
                         name=import_name,
-                        start_line=node.start_point[0] + 1,
-                        end_line=node.end_point[0] + 1,
+                        start_line=line_num,
+                        end_line=line_num,
                         raw_text=import_text,
                         language="java",
                         module_name=import_name,
                         is_static=False,
-                        is_wildcard=import_content.endswith(".*"),
-                        import_statement=import_content,
+                        is_wildcard=import_text.endswith(".*"),
+                        import_statement=import_text,
                     )
-        except (AttributeError, ValueError, IndexError) as e:
-            log_debug(f"Failed to extract import info: {e}")
         except Exception as e:
-            log_error(f"Unexpected error in import extraction: {e}")
-        return None
+            log_debug(f"Failed to extract import info: {e}")
-    def extract_elements(self, tree: "tree_sitter.Tree", source_code: str) -> list:
-        """Extract elements from source code using tree-sitter AST"""
-        elements = []
+        return None
+    def _extract_annotation_optimized(
+        self, node: "tree_sitter.Node"
+    ) -> dict[str, Any] | None:
+        """Extract annotation information optimized"""
         try:
-            elements.extend(self.extract_functions(tree, source_code))
-            elements.extend(self.extract_classes(tree, source_code))
-            elements.extend(self.extract_variables(tree, source_code))
-            elements.extend(self.extract_imports(tree, source_code))
-        except Exception as e:
-            log_error(f"Failed to extract elements: {e}")
-        return elements
-class JavaPlugin(LanguagePlugin):
-    """Java language plugin for the new architecture"""
+            annotation_text = self._get_node_text_optimized(node)
+            start_line = node.start_point[0] + 1
-    def __init__(self) -> None:
-        """Initialize the Java plugin"""
-        super().__init__()
-        self._language_cache: tree_sitter.Language | None = None
-        self._extractor: JavaElementExtractor | None = None
+            # Extract annotation name
+            annotation_name = None
+            for child in node.children:
+                if child.type == "identifier":
+                    annotation_name = self._get_node_text_optimized(child)
+                    break
-        # Legacy attributes for backward compatibility with tests
-        self.language = "java"
-        self.extractor = self.create_extractor()
-        self.supported_extensions = self.get_file_extensions()
+            if not annotation_name:
+                # Try to extract from text
+                match = re.search(r"@(\w+)", annotation_text)
+                if match:
+                    annotation_name = match.group(1)
+            if annotation_name:
+                return {
+                    "name": annotation_name,
+                    "line": start_line,
+                    "text": annotation_text,
+                    "type": "annotation",
+                }
+        except Exception as e:
+            log_debug(f"Failed to extract annotation: {e}")
-    def get_language_name(self) -> str:
-        """Return the name of the programming language this plugin supports"""
-        return "java"
+        return None
-    def get_file_extensions(self) -> list[str]:
-        """Return list of file extensions this plugin supports"""
-        return [".java", ".jsp", ".jspx"]
+    def _determine_visibility(self, modifiers: list[str]) -> str:
+        """Determine visibility from modifiers"""
+        if "public" in modifiers:
+            return "public"
+        elif "private" in modifiers:
+            return "private"
+        elif "protected" in modifiers:
+            return "protected"
+        else:
+            return "package"
-    def create_extractor(self) -> ElementExtractor:
-        """Create and return an element extractor for this language"""
-        return JavaElementExtractor()
+    def _find_annotations_for_line_cached(self, line: int) -> list[dict[str, Any]]:
+        """Find annotations for a specific line with caching"""
+        if line in self._annotation_cache:
+            return self._annotation_cache[line]
-    def get_extractor(self) -> ElementExtractor:
-        """Get the cached extractor instance, creating it if necessary"""
-        if self._extractor is None:
-            self._extractor = JavaElementExtractor()
-        return self._extractor
+        # Find annotations near this line
+        annotations = []
+        for annotation in self.annotations:
+            if abs(annotation.get("line", 0) - line) <= 2:
+                annotations.append(annotation)
-    def get_tree_sitter_language(self) -> Optional["tree_sitter.Language"]:
-        """Get the Tree-sitter language object for Java"""
-        if self._language_cache is None:
-            try:
-                import tree_sitter_java as tsjava
+        self._annotation_cache[line] = annotations
+        return annotations
-                self._language_cache = tsjava.language()  # type: ignore
-            except ImportError:
-                log_error("tree-sitter-java not available")
-                return None
-            except Exception as e:
-                log_error(f"Failed to load Java language: {e}")
-                return None
-        return self._language_cache
+    def _is_nested_class(self, node: "tree_sitter.Node") -> bool:
+        """Check if this is a nested class"""
+        parent = node.parent
+        while parent:
+            if parent.type in [
+                "class_declaration",
+                "interface_declaration",
+                "enum_declaration",
+            ]:
+                return True
+            parent = parent.parent
+        return False
-    def get_supported_queries(self) -> list[str]:
-        """Get list of supported query names for this language"""
-        return ["class", "method", "field", "import"]
+    def _find_parent_class(self, node: "tree_sitter.Node") -> str | None:
+        """Find parent class name for nested classes"""
+        parent = node.parent
+        while parent:
+            if parent.type in [
+                "class_declaration",
+                "interface_declaration",
+                "enum_declaration",
+            ]:
+                for child in parent.children:
+                    if child.type == "identifier":
+                        return self._get_node_text_optimized(child)
+            parent = parent.parent
+        return None
-    def is_applicable(self, file_path: str) -> bool:
-        """Check if this plugin is applicable for the given file"""
-        return any(
-            file_path.lower().endswith(ext.lower())
-            for ext in self.get_file_extensions()
-        )
+    def _calculate_complexity_optimized(self, node: "tree_sitter.Node") -> int:
+        """Calculate cyclomatic complexity optimized"""
+        complexity = 1  # Base complexity
+        # Count decision points
+        decision_nodes = [
+            "if_statement",
+            "while_statement",
+            "for_statement",
+            "switch_statement",
+            "catch_clause",
+            "conditional_expression",
+            "enhanced_for_statement",
+        ]
+        def count_decisions(n: "tree_sitter.Node") -> int:
+            count = 0
+            if hasattr(n, "type") and n.type in decision_nodes:
+                count += 1
+            if hasattr(n, "children"):
+                try:
+                    for child in n.children:
+                        count += count_decisions(child)
+                except (TypeError, AttributeError):
+                    # Handle Mock objects or other non-iterable children
+                    pass
+            return count
+        complexity += count_decisions(node)
+        return complexity
-    def get_plugin_info(self) -> dict:
-        """Get information about this plugin"""
-        return {
-            "name": "Java Plugin",
-            "language": self.get_language_name(),
-            "extensions": self.get_file_extensions(),
-            "version": "2.0.0",
-            "supported_queries": self.get_supported_queries(),
-        }
+    def _extract_javadoc_for_line(self, line: int) -> str | None:
+        """Extract JavaDoc comment for a specific line"""
+        try:
+            # Look for JavaDoc comment before the line
+            for i in range(max(0, line - 10), line):
+                if i < len(self.content_lines):
+                    line_content = self.content_lines[i].strip()
+                    if line_content.startswith("/**"):
+                        # Found start of JavaDoc, collect until */
+                        javadoc_lines = []
+                        for j in range(i, min(len(self.content_lines), line)):
+                            doc_line = self.content_lines[j].strip()
+                            javadoc_lines.append(doc_line)
+                            if doc_line.endswith("*/"):
+                                break
+                        return "\n".join(javadoc_lines)
+        except Exception as e:
+            log_debug(f"Failed to extract JavaDoc: {e}")
-    def execute_query_strategy(
-        self, tree: "tree_sitter.Tree", source_code: str, query_key: str
-    ) -> list[dict]:
-        """
-        Execute query strategy for Java language
+        return None
-        Args:
-            tree: Tree-sitter tree object
-            source_code: Source code string
-            query_key: Query key to execute
+    def _extract_class_name(self, node: "tree_sitter.Node") -> str | None:
+        """Extract class name from a class declaration node."""
+        try:
+            for child in node.children:
+                if child.type == "identifier":
+                    return self._get_node_text_optimized(child)
+            return None
+        except Exception as e:
+            log_debug(f"Failed to extract class name: {e}")
+            return None
-        Returns:
-            List of query results
-        """
-        # Use the extractor to get elements based on query_key
-        extractor = self.get_extractor()
-        # Map query keys to extraction methods
-        if query_key in ["method", "methods", "function", "functions"]:
-            elements = extractor.extract_functions(tree, source_code)
-        elif query_key in ["class", "classes"]:
-            elements = extractor.extract_classes(tree, source_code)
-        elif query_key in ["field", "fields", "variable", "variables"]:
-            elements = extractor.extract_variables(tree, source_code)
-        elif query_key in ["import", "imports"]:
-            elements = extractor.extract_imports(tree, source_code)
-        elif query_key in ["package", "packages"]:
-            elements = extractor.extract_packages(tree, source_code)
-        elif query_key in ["annotation", "annotations"]:
-            elements = extractor.extract_annotations(tree, source_code)
-        else:
-            # For unknown query keys, return empty list
-            return []
-        # Convert elements to query result format
-        results = []
-        for element in elements:
-            result = {
-                "capture_name": query_key,
-                "node_type": self._get_node_type_for_element(element),
-                "start_line": element.start_line,
-                "end_line": element.end_line,
-                "text": element.raw_text,
-                "name": element.name,
-            }
-            results.append(result)
-        return results
+class JavaPlugin(LanguagePlugin):
+    """Java language plugin implementation"""
-    def _get_node_type_for_element(self, element) -> str:
-        """Get appropriate node type for element"""
-        from ..models import Class, Function, Import, Package, Variable
+    def __init__(self) -> None:
+        """Initialize the Java language plugin."""
+        super().__init__()
+        self.extractor = JavaElementExtractor()
+        self.language = "java"  # Add language property for test compatibility
+        self.supported_extensions = (
+            self.get_file_extensions()
+        )  # Add for test compatibility
+        self._cached_language: Any | None = None  # Cache for tree-sitter language
-        if isinstance(element, Function):
-            return (
-                "method_declaration"
-                if not element.is_constructor
-                else "constructor_declaration"
-            )
-        elif isinstance(element, Class):
-            if element.class_type == "interface":
-                return "interface_declaration"
-            elif element.class_type == "enum":
-                return "enum_declaration"
-            else:
-                return "class_declaration"
-        elif isinstance(element, Variable):
-            return "field_declaration"
-        elif isinstance(element, Import):
-            return "import_declaration"
-        elif isinstance(element, Package):
-            return "package_declaration"
-        else:
-            return "unknown"
+    def get_language_name(self) -> str:
+        """Get the language name."""
+        return "java"
-    def get_element_categories(self) -> dict[str, list[str]]:
-        """
-        Get element categories mapping query keys to node types
+    def get_file_extensions(self) -> list[str]:
+        """Get supported file extensions."""
+        return [".java", ".jsp", ".jspx"]
-        Returns:
-            Dictionary mapping query keys to lists of node types
-        """
-        return {
-            # Method-related queries
-            "method": ["method_declaration"],
-            "methods": ["method_declaration"],
-            "constructor": ["constructor_declaration"],
-            "constructors": ["constructor_declaration"],
-            # Class-related queries
-            "class": ["class_declaration"],
-            "classes": ["class_declaration"],
-            "interface": ["interface_declaration"],
-            "interfaces": ["interface_declaration"],
-            "enum": ["enum_declaration"],
-            "enums": ["enum_declaration"],
-            # Field-related queries
-            "field": ["field_declaration"],
-            "fields": ["field_declaration"],
-            # Import-related queries
-            "import": ["import_declaration"],
-            "imports": ["import_declaration"],
-            # Package-related queries
-            "package": ["package_declaration"],
-            "packages": ["package_declaration"],
-            # Annotation-related queries
-            "annotation": ["annotation", "marker_annotation"],
-            "annotations": ["annotation", "marker_annotation"],
-            # Generic queries
-            "all_elements": [
-                "method_declaration",
-                "constructor_declaration",
-                "class_declaration",
-                "interface_declaration",
-                "enum_declaration",
-                "field_declaration",
-                "import_declaration",
-                "package_declaration",
-                "annotation",
-                "marker_annotation",
-            ],
-        }
+    def create_extractor(self) -> ElementExtractor:
+        """Build and return a fresh ``JavaElementExtractor`` on every call."""
+        fresh_extractor = JavaElementExtractor()
+        return fresh_extractor
     async def analyze_file(
         self, file_path: str, request: "AnalysisRequest"
     ) -> "AnalysisResult":
-        """
-        Analyze a Java file and return analysis results.
+        """
+        Analyze Java code and return structured results.
+        Reads file_path with read_file_safe, parses the text with a
+        tree-sitter parser and gathers the extracted elements into one list.
+        Exceptions raised inside the try block are logged and turned into a
+        result with success=False instead of being propagated.
+        Args:
+            file_path: Path of the file to analyze
+            request: Analysis request (not read by this method body)
+        Returns:
+            AnalysisResult describing the file
+        """
-        Args:
-            file_path: Path to the Java file to analyze
-            request: Analysis request object
+        from ..models import AnalysisResult
-        Returns:
-            AnalysisResult object containing the analysis results
-        """
         try:
-            from ..core.parser import Parser
-            from ..models import AnalysisResult
-            log_debug(f"Java Plugin: Starting analysis of {file_path}")
-            # Read file content
-            with open(file_path, encoding="utf-8") as f:
-                source_code = f.read()
-            log_debug(f"Java Plugin: Read {len(source_code)} characters from file")
+            # Read the file through read_file_safe; the detected encoding it also returns is not used below
+            from ..encoding_utils import read_file_safe
-            # Parse the file
-            parser = Parser()
-            parse_result = parser.parse_code(source_code, "java")
+            file_content, detected_encoding = read_file_safe(file_path)
-            log_debug(f"Java Plugin: Parse result success: {parse_result.success}")
-            if not parse_result.success:
-                log_error(f"Java Plugin: Parse failed: {parse_result.error_message}")
+            # Get tree-sitter language and parse
+            language = self.get_tree_sitter_language()
+            if language is None:
+                # Language could not be loaded: return a result without elements (success and error_message are not set here)
                 return AnalysisResult(
                     file_path=file_path,
                     language="java",
-                    line_count=len(source_code.splitlines()),
+                    line_count=len(file_content.split("\n")),
                     elements=[],
-                    node_count=0,
-                    query_results={},
-                    source_code=source_code,
-                    success=False,
-                    error_message=parse_result.error_message,
+                    source_code=file_content,
                 )
-            # Extract elements
-            extractor = self.create_extractor()
+            # Parse the code
+            import tree_sitter
+            parser = tree_sitter.Parser()
-            if parse_result.tree:
-                log_debug("Java Plugin: Extracting packages...")
-                packages = extractor.extract_packages(parse_result.tree, source_code)
-                log_debug(f"Java Plugin: Found {len(packages)} packages")
+            # Attach the language through whichever hook this parser object exposes (presumably varies by tree-sitter version - confirm)
+            if hasattr(parser, "set_language"):
+                parser.set_language(language)
+            elif hasattr(parser, "language"):
+                parser.language = language
+            else:
+                # Try constructor approach as last resort
+                try:
+                    parser = tree_sitter.Parser(language)
+                except Exception as e:
+                    log_error(f"Failed to create parser with language: {e}")
+                    return AnalysisResult(
+                        file_path=file_path,
+                        language="java",
+                        line_count=len(file_content.split("\n")),
+                        elements=[],
+                        source_code=file_content,
+                        error_message=f"Parser creation failed: {e}",
+                        success=False,
+                    )
-                log_debug("Java Plugin: Extracting functions...")
-                functions = extractor.extract_functions(parse_result.tree, source_code)
-                log_debug(f"Java Plugin: Found {len(functions)} functions")
+            tree = parser.parse(file_content.encode("utf-8"))
-                log_debug("Java Plugin: Extracting classes...")
-                classes = extractor.extract_classes(parse_result.tree, source_code)
-                log_debug(f"Java Plugin: Found {len(classes)} classes")
+            # Extract elements using our extractor
+            elements_dict = self.extract_elements(tree, file_content)
-                log_debug("Java Plugin: Extracting variables...")
-                variables = extractor.extract_variables(parse_result.tree, source_code)
-                log_debug(f"Java Plugin: Found {len(variables)} variables")
+            # Combine all elements into a single list
+            all_elements = []
+            all_elements.extend(elements_dict.get("functions", []))
+            all_elements.extend(elements_dict.get("classes", []))
+            all_elements.extend(elements_dict.get("variables", []))
+            all_elements.extend(elements_dict.get("imports", []))
+            all_elements.extend(elements_dict.get("packages", []))
-                log_debug("Java Plugin: Extracting imports...")
-                imports = extractor.extract_imports(parse_result.tree, source_code)
-                log_debug(f"Java Plugin: Found {len(imports)} imports")
-            else:
-                packages = []
-                functions = []
-                classes = []
-                variables = []
-                imports = []
-            # Combine all elements
-            all_elements: list[CodeElement] = []
-            all_elements.extend(packages)
-            all_elements.extend(functions)
-            all_elements.extend(classes)
-            all_elements.extend(variables)
-            all_elements.extend(imports)
-            log_debug(f"Java Plugin: Total elements: {len(all_elements)}")
+            # Use the first extracted package, if any, as the result's package
+            packages = elements_dict.get("packages", [])
+            package = packages[0] if packages else None
+            # Count every node in the AST tree (0 when there is no tree or root node)
+            node_count = self._count_tree_nodes(tree.root_node) if tree and tree.root_node else 0
             return AnalysisResult(
                 file_path=file_path,
                 language="java",
-                line_count=len(source_code.splitlines()),
+                line_count=len(file_content.split("\n")),
                 elements=all_elements,
-                node_count=(
-                    parse_result.tree.root_node.child_count if parse_result.tree else 0
-                ),
-                query_results={},
-                source_code=source_code,
-                success=True,
-                error_message=None,
+                node_count=node_count,
+                source_code=file_content,
+                package=package,
             )
         except Exception as e:
-            log_error(f"Failed to analyze Java file {file_path}: {e}")
-            import traceback
-            log_error(f"Java Plugin traceback: {traceback.format_exc()}")
+            log_error(f"Error analyzing Java file {file_path}: {e}")
+            # Return empty result on error
             return AnalysisResult(
                 file_path=file_path,
                 language="java",
                 line_count=0,
                 elements=[],
-                node_count=0,
-                query_results={},
                 source_code="",
-                success=False,
                 error_message=str(e),
+                success=False,
             )
-    def extract_elements(
-        self, tree: "tree_sitter.Tree", source_code: str
-    ) -> dict[str, list[CodeElement]]:
-        """Legacy method for backward compatibility with tests"""
-        if not tree or not tree.root_node:
+    def _count_tree_nodes(self, node: Any) -> int:
+        """
+        Count the nodes of the AST subtree rooted at ``node``.
+        The walk uses an explicit stack instead of recursion, so deeply
+        nested trees cannot exceed Python's recursion limit.
+        Args:
+            node: Tree-sitter node, or None
+        Returns:
+            Total number of nodes including ``node`` itself; 0 for None
+        """
+        total = 0
+        pending = [node]
+        while pending:
+            current = pending.pop()
+            if current is None:
+                continue
+            total += 1
+            # Objects without a ``children`` attribute are counted as leaves.
+            if hasattr(current, "children"):
+                pending.extend(current.children)
+        return total
+    def get_tree_sitter_language(self) -> Any | None:
+        """
+        Load the tree-sitter language for Java, caching it on the instance.
+        Returns:
+            The cached or newly loaded language object, or None when loading
+            fails (the failure is reported through log_error)
+        """
+        cached = self._cached_language
+        if cached is not None:
+            return cached
+        try:
+            import tree_sitter
+            import tree_sitter_java
+            loaded = tree_sitter_java.language()
+            # Anything whose type name lacks "Language" is treated as a raw
+            # PyCapsule that still has to be wrapped in tree_sitter.Language.
+            if "Language" not in str(type(loaded)):
+                try:
+                    loaded = tree_sitter.Language(loaded)
+                except Exception as e:
+                    log_error(f"Failed to create Language object from PyCapsule: {e}")
+                    return None
+            self._cached_language = loaded
+            return self._cached_language
+        except ImportError as e:
+            log_error(f"tree-sitter-java not available: {e}")
+            return None
+        except Exception as e:
+            log_error(f"Failed to load tree-sitter language for Java: {e}")
+            return None
+    def extract_elements(self, tree: Any | None, source_code: str) -> dict[str, Any]:
+        """
+        Extract all elements from Java code for test compatibility.
+        Args:
+            tree: Parsed tree, or None
+            source_code: Source text passed to every extractor call
+        Returns:
+            Dict with the keys "functions", "classes", "variables", "imports",
+            "packages" and "annotations"; every value is an empty list when
+            tree is None or when extraction raises (the error is logged)
+        """
+        if tree is None:
             return {
-                "packages": [],
                 "functions": [],
                 "classes": [],
                 "variables": [],
                 "imports": [],
+                "packages": [],
                 "annotations": [],
             }
-        extractor = self.create_extractor()
-        # Extract all types of elements and return as dictionary
-        result = {
-            "packages": extractor.extract_packages(tree, source_code),
-            "functions": extractor.extract_functions(tree, source_code),
-            "classes": extractor.extract_classes(tree, source_code),
-            "variables": extractor.extract_variables(tree, source_code),
-            "imports": extractor.extract_imports(tree, source_code),
-            "annotations": extractor.extract_annotations(tree, source_code),
-        }
+        try:
+            extractor = self.create_extractor()
+            return {
+                "functions": extractor.extract_functions(tree, source_code),
+                "classes": extractor.extract_classes(tree, source_code),
+                "variables": extractor.extract_variables(tree, source_code),
+                "imports": extractor.extract_imports(tree, source_code),
+                "packages": extractor.extract_packages(tree, source_code),
+                "annotations": extractor.extract_annotations(tree, source_code),
+            }
+        except Exception as e:
+            log_error(f"Error extracting elements: {e}")
+            return {
+                "functions": [],
+                "classes": [],
+                "variables": [],
+                "imports": [],
+                "packages": [],
+                "annotations": [],
+            }
-        return result
+    def supports_file(self, file_path: str) -> bool:
+        """Return True when file_path ends, case-insensitively, with a supported extension."""
+        known_suffixes = tuple(self.get_file_extensions())
+        return file_path.lower().endswith(known_suffixes)

tree-sitter-analyzer 1.9.2__py3-none-any.whl → 1.9.4__py3-none-any.whl

Potentially problematic release.

tree-sitter-analyzer 1.9.2 (py3-none-any.whl) → 1.9.4 (py3-none-any.whl)