tree-sitter-analyzer: tree_sitter_analyzer-0.1.3-py3-none-any.whl → tree_sitter_analyzer-0.3.0-py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of tree-sitter-analyzer might be problematic. Click here for more details.

Files changed (79)
  1. tree_sitter_analyzer/__init__.py +133 -121
  2. tree_sitter_analyzer/__main__.py +11 -12
  3. tree_sitter_analyzer/api.py +531 -539
  4. tree_sitter_analyzer/cli/__init__.py +39 -39
  5. tree_sitter_analyzer/cli/__main__.py +12 -13
  6. tree_sitter_analyzer/cli/commands/__init__.py +26 -27
  7. tree_sitter_analyzer/cli/commands/advanced_command.py +88 -88
  8. tree_sitter_analyzer/cli/commands/base_command.py +160 -155
  9. tree_sitter_analyzer/cli/commands/default_command.py +18 -19
  10. tree_sitter_analyzer/cli/commands/partial_read_command.py +141 -133
  11. tree_sitter_analyzer/cli/commands/query_command.py +81 -82
  12. tree_sitter_analyzer/cli/commands/structure_command.py +138 -121
  13. tree_sitter_analyzer/cli/commands/summary_command.py +101 -93
  14. tree_sitter_analyzer/cli/commands/table_command.py +232 -233
  15. tree_sitter_analyzer/cli/info_commands.py +120 -121
  16. tree_sitter_analyzer/cli_main.py +277 -276
  17. tree_sitter_analyzer/core/__init__.py +15 -20
  18. tree_sitter_analyzer/core/analysis_engine.py +591 -574
  19. tree_sitter_analyzer/core/cache_service.py +320 -330
  20. tree_sitter_analyzer/core/engine.py +557 -560
  21. tree_sitter_analyzer/core/parser.py +293 -288
  22. tree_sitter_analyzer/core/query.py +494 -502
  23. tree_sitter_analyzer/encoding_utils.py +458 -460
  24. tree_sitter_analyzer/exceptions.py +337 -340
  25. tree_sitter_analyzer/file_handler.py +217 -222
  26. tree_sitter_analyzer/formatters/__init__.py +1 -1
  27. tree_sitter_analyzer/formatters/base_formatter.py +167 -168
  28. tree_sitter_analyzer/formatters/formatter_factory.py +78 -74
  29. tree_sitter_analyzer/formatters/java_formatter.py +287 -270
  30. tree_sitter_analyzer/formatters/python_formatter.py +255 -235
  31. tree_sitter_analyzer/interfaces/__init__.py +9 -10
  32. tree_sitter_analyzer/interfaces/cli.py +528 -557
  33. tree_sitter_analyzer/interfaces/cli_adapter.py +322 -319
  34. tree_sitter_analyzer/interfaces/mcp_adapter.py +180 -170
  35. tree_sitter_analyzer/interfaces/mcp_server.py +405 -416
  36. tree_sitter_analyzer/java_analyzer.py +218 -219
  37. tree_sitter_analyzer/language_detector.py +398 -400
  38. tree_sitter_analyzer/language_loader.py +224 -228
  39. tree_sitter_analyzer/languages/__init__.py +10 -11
  40. tree_sitter_analyzer/languages/java_plugin.py +1129 -1113
  41. tree_sitter_analyzer/languages/python_plugin.py +737 -712
  42. tree_sitter_analyzer/mcp/__init__.py +31 -32
  43. tree_sitter_analyzer/mcp/resources/__init__.py +44 -47
  44. tree_sitter_analyzer/mcp/resources/code_file_resource.py +212 -213
  45. tree_sitter_analyzer/mcp/resources/project_stats_resource.py +560 -550
  46. tree_sitter_analyzer/mcp/server.py +333 -345
  47. tree_sitter_analyzer/mcp/tools/__init__.py +30 -31
  48. tree_sitter_analyzer/mcp/tools/analyze_scale_tool.py +621 -557
  49. tree_sitter_analyzer/mcp/tools/analyze_scale_tool_cli_compatible.py +242 -245
  50. tree_sitter_analyzer/mcp/tools/base_tool.py +54 -55
  51. tree_sitter_analyzer/mcp/tools/read_partial_tool.py +300 -302
  52. tree_sitter_analyzer/mcp/tools/table_format_tool.py +362 -359
  53. tree_sitter_analyzer/mcp/tools/universal_analyze_tool.py +543 -476
  54. tree_sitter_analyzer/mcp/utils/__init__.py +105 -106
  55. tree_sitter_analyzer/mcp/utils/error_handler.py +549 -549
  56. tree_sitter_analyzer/models.py +470 -481
  57. tree_sitter_analyzer/output_manager.py +261 -264
  58. tree_sitter_analyzer/plugins/__init__.py +333 -334
  59. tree_sitter_analyzer/plugins/base.py +477 -446
  60. tree_sitter_analyzer/plugins/java_plugin.py +608 -625
  61. tree_sitter_analyzer/plugins/javascript_plugin.py +446 -439
  62. tree_sitter_analyzer/plugins/manager.py +362 -355
  63. tree_sitter_analyzer/plugins/plugin_loader.py +85 -83
  64. tree_sitter_analyzer/plugins/python_plugin.py +606 -598
  65. tree_sitter_analyzer/plugins/registry.py +374 -366
  66. tree_sitter_analyzer/queries/__init__.py +26 -27
  67. tree_sitter_analyzer/queries/java.py +391 -394
  68. tree_sitter_analyzer/queries/javascript.py +148 -149
  69. tree_sitter_analyzer/queries/python.py +285 -286
  70. tree_sitter_analyzer/queries/typescript.py +229 -230
  71. tree_sitter_analyzer/query_loader.py +254 -260
  72. tree_sitter_analyzer/table_formatter.py +468 -448
  73. tree_sitter_analyzer/utils.py +277 -277
  74. tree_sitter_analyzer-0.3.0.dist-info/METADATA +346 -0
  75. tree_sitter_analyzer-0.3.0.dist-info/RECORD +77 -0
  76. tree_sitter_analyzer-0.1.3.dist-info/METADATA +0 -444
  77. tree_sitter_analyzer-0.1.3.dist-info/RECORD +0 -77
  78. {tree_sitter_analyzer-0.1.3.dist-info → tree_sitter_analyzer-0.3.0.dist-info}/WHEEL +0 -0
  79. {tree_sitter_analyzer-0.1.3.dist-info → tree_sitter_analyzer-0.3.0.dist-info}/entry_points.txt +0 -0
--- tree_sitter_analyzer/api.py (0.1.3)
+++ tree_sitter_analyzer/api.py (0.3.0)
@@ -1,539 +1,531 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- Tree-sitter Analyzer API
5
-
6
- Public API facade that provides a stable, high-level interface to the
7
- tree-sitter analyzer framework. This is the main entry point for both
8
- CLI and MCP interfaces.
9
- """
10
-
11
- from pathlib import Path
12
- from typing import Any, Dict, List, Optional, Union
13
- import logging
14
-
15
- from .core.engine import AnalysisEngine
16
- from .utils import log_error, log_info, log_warning
17
-
18
- logger = logging.getLogger(__name__)
19
-
20
- # Global engine instance (singleton pattern)
21
- _engine: Optional[AnalysisEngine] = None
22
-
23
-
24
- def get_engine() -> AnalysisEngine:
25
- """
26
- Get the global analysis engine instance.
27
-
28
- Returns:
29
- AnalysisEngine instance
30
- """
31
- global _engine
32
- if _engine is None:
33
- _engine = AnalysisEngine()
34
- return _engine
35
-
36
-
37
- def analyze_file(
38
- file_path: Union[str, Path],
39
- language: Optional[str] = None,
40
- queries: Optional[List[str]] = None,
41
- include_elements: bool = True,
42
- include_details: bool = False, # Add for backward compatibility
43
- include_queries: bool = True,
44
- include_complexity: bool = False # Add for backward compatibility
45
- ) -> Dict[str, Any]:
46
- """
47
- Analyze a source code file.
48
-
49
- This is the main high-level function for file analysis. It handles
50
- language detection, parsing, query execution, and element extraction.
51
-
52
- Args:
53
- file_path: Path to the source file to analyze
54
- language: Programming language (auto-detected if not specified)
55
- queries: List of query names to execute (all available if not specified)
56
- include_elements: Whether to extract code elements
57
- include_queries: Whether to execute queries
58
- include_complexity: Whether to include complexity metrics (backward compatibility)
59
-
60
- Returns:
61
- Analysis results dictionary containing:
62
- - success: Whether the analysis was successful
63
- - file_info: Basic file information
64
- - language_info: Detected/specified language information
65
- - ast_info: Abstract syntax tree information
66
- - query_results: Results from executed queries (if include_queries=True)
67
- - elements: Extracted code elements (if include_elements=True)
68
- - error: Error message (if success=False)
69
- """
70
- try:
71
- engine = get_engine()
72
-
73
- # Perform the analysis
74
- analysis_result = engine.analyze_file(file_path, language)
75
-
76
- # Convert AnalysisResult to expected API format
77
- result = {
78
- "success": analysis_result.success,
79
- "file_info": {
80
- "path": str(file_path),
81
- "exists": Path(file_path).exists(),
82
- "size": Path(file_path).stat().st_size if Path(file_path).exists() else 0
83
- },
84
- "language_info": {
85
- "language": analysis_result.language,
86
- "detected": language is None # True if language was auto-detected
87
- },
88
- "ast_info": {
89
- "node_count": analysis_result.node_count,
90
- "line_count": analysis_result.line_count
91
- }
92
- }
93
-
94
- # Add elements if requested and available
95
- if include_elements and hasattr(analysis_result, 'elements'):
96
- result["elements"] = [
97
- {
98
- "name": elem.name,
99
- "type": type(elem).__name__.lower(),
100
- "start_line": elem.start_line,
101
- "end_line": elem.end_line,
102
- "raw_text": elem.raw_text,
103
- "language": elem.language
104
- }
105
- for elem in analysis_result.elements
106
- ]
107
-
108
- # Add query results if requested and available
109
- if include_queries and hasattr(analysis_result, 'query_results'):
110
- result["query_results"] = analysis_result.query_results
111
-
112
- # Add error message if analysis failed
113
- if not analysis_result.success and analysis_result.error_message:
114
- result["error"] = analysis_result.error_message
115
-
116
- # Filter results based on options
117
- if not include_elements and "elements" in result:
118
- del result["elements"]
119
-
120
- if not include_queries and "query_results" in result:
121
- del result["query_results"]
122
-
123
- return result
124
-
125
- except FileNotFoundError as e:
126
- # Re-raise FileNotFoundError for tests that expect it
127
- raise e
128
- except Exception as e:
129
- log_error(f"API analyze_file failed: {e}")
130
- return {
131
- "success": False,
132
- "error": str(e),
133
- "file_info": {"path": str(file_path), "exists": Path(file_path).exists()}
134
- }
135
-
136
-
137
- def analyze_code(
138
- source_code: str,
139
- language: str,
140
- queries: Optional[List[str]] = None,
141
- include_elements: bool = True,
142
- include_queries: bool = True
143
- ) -> Dict[str, Any]:
144
- """
145
- Analyze source code directly (without file).
146
-
147
- Args:
148
- source_code: Source code string to analyze
149
- language: Programming language
150
- queries: List of query names to execute (all available if not specified)
151
- include_elements: Whether to extract code elements
152
- include_queries: Whether to execute queries
153
-
154
- Returns:
155
- Analysis results dictionary
156
- """
157
- try:
158
- engine = get_engine()
159
-
160
- # Perform the analysis
161
- analysis_result = engine.analyze_code(source_code, language)
162
-
163
- # Convert AnalysisResult to expected API format
164
- result = {
165
- "success": analysis_result.success,
166
- "language_info": {
167
- "language": analysis_result.language,
168
- "detected": False # Language was explicitly provided
169
- },
170
- "ast_info": {
171
- "node_count": analysis_result.node_count,
172
- "line_count": analysis_result.line_count
173
- }
174
- }
175
-
176
- # Add elements if requested and available
177
- if include_elements and hasattr(analysis_result, 'elements'):
178
- result["elements"] = [
179
- {
180
- "name": elem.name,
181
- "type": type(elem).__name__.lower(),
182
- "start_line": elem.start_line,
183
- "end_line": elem.end_line,
184
- "raw_text": elem.raw_text,
185
- "language": elem.language
186
- }
187
- for elem in analysis_result.elements
188
- ]
189
-
190
- # Add query results if requested and available
191
- if include_queries and hasattr(analysis_result, 'query_results'):
192
- result["query_results"] = analysis_result.query_results
193
-
194
- # Add error message if analysis failed
195
- if not analysis_result.success and analysis_result.error_message:
196
- result["error"] = analysis_result.error_message
197
-
198
- # Filter results based on options
199
- if not include_elements and "elements" in result:
200
- del result["elements"]
201
-
202
- if not include_queries and "query_results" in result:
203
- del result["query_results"]
204
-
205
- return result
206
-
207
- except Exception as e:
208
- log_error(f"API analyze_code failed: {e}")
209
- return {
210
- "success": False,
211
- "error": str(e)
212
- }
213
-
214
-
215
- def get_supported_languages() -> List[str]:
216
- """
217
- Get list of all supported programming languages.
218
-
219
- Returns:
220
- List of supported language names
221
- """
222
- try:
223
- engine = get_engine()
224
- return engine.get_supported_languages()
225
- except Exception as e:
226
- log_error(f"Failed to get supported languages: {e}")
227
- return []
228
-
229
-
230
- def get_available_queries(language: str) -> List[str]:
231
- """
232
- Get available queries for a specific language.
233
-
234
- Args:
235
- language: Programming language name
236
-
237
- Returns:
238
- List of available query names
239
- """
240
- try:
241
- engine = get_engine()
242
- # Try to get plugin and its supported queries
243
- plugin = engine._get_language_plugin(language)
244
- if plugin and hasattr(plugin, 'get_supported_queries'):
245
- return plugin.get_supported_queries()
246
- else:
247
- # Return default queries
248
- return ['class', 'method', 'field']
249
- except Exception as e:
250
- log_error(f"Failed to get available queries for {language}: {e}")
251
- return []
252
-
253
-
254
- def is_language_supported(language: str) -> bool:
255
- """
256
- Check if a programming language is supported.
257
-
258
- Args:
259
- language: Programming language name
260
-
261
- Returns:
262
- True if the language is supported
263
- """
264
- try:
265
- supported_languages = get_supported_languages()
266
- return language.lower() in [lang.lower() for lang in supported_languages]
267
- except Exception as e:
268
- log_error(f"Failed to check language support for {language}: {e}")
269
- return False
270
-
271
-
272
- def detect_language(file_path: Union[str, Path]) -> Optional[str]:
273
- """
274
- Detect programming language from file path.
275
-
276
- Args:
277
- file_path: Path to the file
278
-
279
- Returns:
280
- Detected language name or None
281
- """
282
- try:
283
- engine = get_engine()
284
- # Use language_detector instead of language_registry
285
- return engine.language_detector.detect_from_extension(str(file_path))
286
- except Exception as e:
287
- log_error(f"Failed to detect language for {file_path}: {e}")
288
- return None
289
-
290
-
291
- def get_file_extensions(language: str) -> List[str]:
292
- """
293
- Get file extensions for a specific language.
294
-
295
- Args:
296
- language: Programming language name
297
-
298
- Returns:
299
- List of file extensions
300
- """
301
- try:
302
- engine = get_engine()
303
- # Use language_detector to get extensions
304
- if hasattr(engine.language_detector, 'get_extensions_for_language'):
305
- return engine.language_detector.get_extensions_for_language(language)
306
- else:
307
- # Fallback: return common extensions
308
- extension_map = {
309
- 'java': ['.java'],
310
- 'python': ['.py'],
311
- 'javascript': ['.js'],
312
- 'typescript': ['.ts'],
313
- 'c': ['.c'],
314
- 'cpp': ['.cpp', '.cxx', '.cc'],
315
- 'go': ['.go'],
316
- 'rust': ['.rs']
317
- }
318
- return extension_map.get(language.lower(), [])
319
- except Exception as e:
320
- log_error(f"Failed to get extensions for {language}: {e}")
321
- return []
322
-
323
-
324
- def validate_file(file_path: Union[str, Path]) -> Dict[str, Any]:
325
- """
326
- Validate a source code file without full analysis.
327
-
328
- Args:
329
- file_path: Path to the file to validate
330
-
331
- Returns:
332
- Validation results dictionary
333
- """
334
- file_path = Path(file_path)
335
-
336
- result = {
337
- "valid": False,
338
- "exists": file_path.exists(),
339
- "readable": False,
340
- "language": None,
341
- "supported": False,
342
- "size": 0,
343
- "errors": []
344
- }
345
-
346
- try:
347
- # Check if file exists
348
- if not file_path.exists():
349
- result["errors"].append("File does not exist")
350
- return result
351
-
352
- # Check if file is readable
353
- try:
354
- with open(file_path, 'r', encoding='utf-8') as f:
355
- content = f.read(100) # Read first 100 chars to test
356
- result["readable"] = True
357
- result["size"] = file_path.stat().st_size
358
- except Exception as e:
359
- result["errors"].append(f"File is not readable: {e}")
360
- return result
361
-
362
- # Detect language
363
- language = detect_language(file_path)
364
- result["language"] = language
365
-
366
- if language:
367
- result["supported"] = is_language_supported(language)
368
- if not result["supported"]:
369
- result["errors"].append(f"Language '{language}' is not supported")
370
- else:
371
- result["errors"].append("Could not detect programming language")
372
-
373
- # If we got this far with no errors, the file is valid
374
- result["valid"] = len(result["errors"]) == 0
375
-
376
- except Exception as e:
377
- result["errors"].append(f"Validation failed: {e}")
378
-
379
- return result
380
-
381
-
382
- def get_framework_info() -> Dict[str, Any]:
383
- """
384
- Get information about the framework and its capabilities.
385
-
386
- Returns:
387
- Framework information dictionary
388
- """
389
- try:
390
- engine = get_engine()
391
-
392
- return {
393
- "name": "tree-sitter-analyzer",
394
- "version": "2.0.0", # New architecture version
395
- "supported_languages": engine.get_supported_languages(),
396
- "total_languages": len(engine.get_supported_languages()),
397
- "plugin_info": {
398
- "manager_available": engine.plugin_manager is not None,
399
- "loaded_plugins": len(engine.plugin_manager.get_supported_languages()) if engine.plugin_manager else 0
400
- },
401
- "core_components": [
402
- "AnalysisEngine",
403
- "Parser",
404
- "QueryExecutor",
405
- "PluginManager",
406
- "LanguageDetector"
407
- ]
408
- }
409
- except Exception as e:
410
- log_error(f"Failed to get framework info: {e}")
411
- return {
412
- "name": "tree-sitter-analyzer",
413
- "version": "2.0.0",
414
- "error": str(e)
415
- }
416
-
417
-
418
- def execute_query(
419
- file_path: Union[str, Path],
420
- query_name: str,
421
- language: Optional[str] = None
422
- ) -> Dict[str, Any]:
423
- """
424
- Execute a specific query against a file.
425
-
426
- Args:
427
- file_path: Path to the source file
428
- query_name: Name of the query to execute
429
- language: Programming language (auto-detected if not specified)
430
-
431
- Returns:
432
- Query execution results
433
- """
434
- try:
435
- # Analyze with only the specified query
436
- result = analyze_file(
437
- file_path,
438
- language=language,
439
- queries=[query_name],
440
- include_elements=False,
441
- include_queries=True
442
- )
443
-
444
- if result["success"] and "query_results" in result:
445
- query_results = result["query_results"].get(query_name, [])
446
- return {
447
- "success": True,
448
- "query_name": query_name,
449
- "results": query_results,
450
- "count": len(query_results),
451
- "language": result.get("language_info", {}).get("language"),
452
- "file_path": str(file_path)
453
- }
454
- else:
455
- return {
456
- "success": False,
457
- "query_name": query_name,
458
- "error": result.get("error", "Unknown error"),
459
- "file_path": str(file_path)
460
- }
461
-
462
- except Exception as e:
463
- log_error(f"Query execution failed: {e}")
464
- return {
465
- "success": False,
466
- "query_name": query_name,
467
- "error": str(e),
468
- "file_path": str(file_path)
469
- }
470
-
471
-
472
- def extract_elements(
473
- file_path: Union[str, Path],
474
- language: Optional[str] = None,
475
- element_types: Optional[List[str]] = None
476
- ) -> Dict[str, Any]:
477
- """
478
- Extract code elements from a file.
479
-
480
- Args:
481
- file_path: Path to the source file
482
- language: Programming language (auto-detected if not specified)
483
- element_types: Types of elements to extract (all if not specified)
484
-
485
- Returns:
486
- Element extraction results
487
- """
488
- try:
489
- # Analyze with only element extraction
490
- result = analyze_file(
491
- file_path,
492
- language=language,
493
- include_elements=True,
494
- include_queries=False
495
- )
496
-
497
- if result["success"] and "elements" in result:
498
- elements = result["elements"]
499
-
500
- # Filter by element types if specified
501
- if element_types:
502
- filtered_elements = []
503
- for element in elements:
504
- if any(etype.lower() in element.get("type", "").lower() for etype in element_types):
505
- filtered_elements.append(element)
506
- elements = filtered_elements
507
-
508
- return {
509
- "success": True,
510
- "elements": elements,
511
- "count": len(elements),
512
- "language": result.get("language_info", {}).get("language"),
513
- "file_path": str(file_path)
514
- }
515
- else:
516
- return {
517
- "success": False,
518
- "error": result.get("error", "Unknown error"),
519
- "file_path": str(file_path)
520
- }
521
-
522
- except Exception as e:
523
- log_error(f"Element extraction failed: {e}")
524
- return {
525
- "success": False,
526
- "error": str(e),
527
- "file_path": str(file_path)
528
- }
529
-
530
-
531
- # Convenience functions for backward compatibility
532
- def analyze(file_path: Union[str, Path], **kwargs) -> Dict[str, Any]:
533
- """Convenience function that aliases to analyze_file."""
534
- return analyze_file(file_path, **kwargs)
535
-
536
-
537
- def get_languages() -> List[str]:
538
- """Convenience function that aliases to get_supported_languages."""
539
- return get_supported_languages()
1
+ #!/usr/bin/env python3
2
+ """
3
+ Tree-sitter Analyzer API
4
+
5
+ Public API facade that provides a stable, high-level interface to the
6
+ tree-sitter analyzer framework. This is the main entry point for both
7
+ CLI and MCP interfaces.
8
+ """
9
+
10
+ import logging
11
+ from pathlib import Path
12
+ from typing import Any
13
+
14
+ from .core.engine import AnalysisEngine
15
+ from .utils import log_error
16
+
17
+ logger = logging.getLogger(__name__)
18
+
19
+ # Global engine instance (singleton pattern)
20
+ _engine: AnalysisEngine | None = None
21
+
22
+
23
+ def get_engine() -> AnalysisEngine:
24
+ """
25
+ Get the global analysis engine instance.
26
+
27
+ Returns:
28
+ AnalysisEngine instance
29
+ """
30
+ global _engine
31
+ if _engine is None:
32
+ _engine = AnalysisEngine()
33
+ return _engine
34
+
35
+
36
+ def analyze_file(
37
+ file_path: str | Path,
38
+ language: str | None = None,
39
+ queries: list[str] | None = None,
40
+ include_elements: bool = True,
41
+ include_details: bool = False, # Add for backward compatibility
42
+ include_queries: bool = True,
43
+ include_complexity: bool = False, # Add for backward compatibility
44
+ ) -> dict[str, Any]:
45
+ """
46
+ Analyze a source code file.
47
+
48
+ This is the main high-level function for file analysis. It handles
49
+ language detection, parsing, query execution, and element extraction.
50
+
51
+ Args:
52
+ file_path: Path to the source file to analyze
53
+ language: Programming language (auto-detected if not specified)
54
+ queries: List of query names to execute (all available if not specified)
55
+ include_elements: Whether to extract code elements
56
+ include_queries: Whether to execute queries
57
+ include_complexity: Whether to include complexity metrics (backward compatibility)
58
+
59
+ Returns:
60
+ Analysis results dictionary containing:
61
+ - success: Whether the analysis was successful
62
+ - file_info: Basic file information
63
+ - language_info: Detected/specified language information
64
+ - ast_info: Abstract syntax tree information
65
+ - query_results: Results from executed queries (if include_queries=True)
66
+ - elements: Extracted code elements (if include_elements=True)
67
+ - error: Error message (if success=False)
68
+ """
69
+ try:
70
+ engine = get_engine()
71
+
72
+ # Perform the analysis
73
+ analysis_result = engine.analyze_file(file_path, language)
74
+
75
+ # Convert AnalysisResult to expected API format
76
+ result = {
77
+ "success": analysis_result.success,
78
+ "file_info": {
79
+ "path": str(file_path),
80
+ "exists": Path(file_path).exists(),
81
+ "size": (
82
+ Path(file_path).stat().st_size if Path(file_path).exists() else 0
83
+ ),
84
+ },
85
+ "language_info": {
86
+ "language": analysis_result.language,
87
+ "detected": language is None, # True if language was auto-detected
88
+ },
89
+ "ast_info": {
90
+ "node_count": analysis_result.node_count,
91
+ "line_count": analysis_result.line_count,
92
+ },
93
+ }
94
+
95
+ # Add elements if requested and available
96
+ if include_elements and hasattr(analysis_result, "elements"):
97
+ result["elements"] = [
98
+ {
99
+ "name": elem.name,
100
+ "type": type(elem).__name__.lower(),
101
+ "start_line": elem.start_line,
102
+ "end_line": elem.end_line,
103
+ "raw_text": elem.raw_text,
104
+ "language": elem.language,
105
+ }
106
+ for elem in analysis_result.elements
107
+ ]
108
+
109
+ # Add query results if requested and available
110
+ if include_queries and hasattr(analysis_result, "query_results"):
111
+ result["query_results"] = analysis_result.query_results
112
+
113
+ # Add error message if analysis failed
114
+ if not analysis_result.success and analysis_result.error_message:
115
+ result["error"] = analysis_result.error_message
116
+
117
+ # Filter results based on options
118
+ if not include_elements and "elements" in result:
119
+ del result["elements"]
120
+
121
+ if not include_queries and "query_results" in result:
122
+ del result["query_results"]
123
+
124
+ return result
125
+
126
+ except FileNotFoundError as e:
127
+ # Re-raise FileNotFoundError for tests that expect it
128
+ raise e
129
+ except Exception as e:
130
+ log_error(f"API analyze_file failed: {e}")
131
+ return {
132
+ "success": False,
133
+ "error": str(e),
134
+ "file_info": {"path": str(file_path), "exists": Path(file_path).exists()},
135
+ }
136
+
137
+
138
+ def analyze_code(
139
+ source_code: str,
140
+ language: str,
141
+ queries: list[str] | None = None,
142
+ include_elements: bool = True,
143
+ include_queries: bool = True,
144
+ ) -> dict[str, Any]:
145
+ """
146
+ Analyze source code directly (without file).
147
+
148
+ Args:
149
+ source_code: Source code string to analyze
150
+ language: Programming language
151
+ queries: List of query names to execute (all available if not specified)
152
+ include_elements: Whether to extract code elements
153
+ include_queries: Whether to execute queries
154
+
155
+ Returns:
156
+ Analysis results dictionary
157
+ """
158
+ try:
159
+ engine = get_engine()
160
+
161
+ # Perform the analysis
162
+ analysis_result = engine.analyze_code(source_code, language)
163
+
164
+ # Convert AnalysisResult to expected API format
165
+ result = {
166
+ "success": analysis_result.success,
167
+ "language_info": {
168
+ "language": analysis_result.language,
169
+ "detected": False, # Language was explicitly provided
170
+ },
171
+ "ast_info": {
172
+ "node_count": analysis_result.node_count,
173
+ "line_count": analysis_result.line_count,
174
+ },
175
+ }
176
+
177
+ # Add elements if requested and available
178
+ if include_elements and hasattr(analysis_result, "elements"):
179
+ result["elements"] = [
180
+ {
181
+ "name": elem.name,
182
+ "type": type(elem).__name__.lower(),
183
+ "start_line": elem.start_line,
184
+ "end_line": elem.end_line,
185
+ "raw_text": elem.raw_text,
186
+ "language": elem.language,
187
+ }
188
+ for elem in analysis_result.elements
189
+ ]
190
+
191
+ # Add query results if requested and available
192
+ if include_queries and hasattr(analysis_result, "query_results"):
193
+ result["query_results"] = analysis_result.query_results
194
+
195
+ # Add error message if analysis failed
196
+ if not analysis_result.success and analysis_result.error_message:
197
+ result["error"] = analysis_result.error_message
198
+
199
+ # Filter results based on options
200
+ if not include_elements and "elements" in result:
201
+ del result["elements"]
202
+
203
+ if not include_queries and "query_results" in result:
204
+ del result["query_results"]
205
+
206
+ return result
207
+
208
+ except Exception as e:
209
+ log_error(f"API analyze_code failed: {e}")
210
+ return {"success": False, "error": str(e)}
211
+
212
+
213
+ def get_supported_languages() -> list[str]:
214
+ """
215
+ Get list of all supported programming languages.
216
+
217
+ Returns:
218
+ List of supported language names
219
+ """
220
+ try:
221
+ engine = get_engine()
222
+ return engine.get_supported_languages()
223
+ except Exception as e:
224
+ log_error(f"Failed to get supported languages: {e}")
225
+ return []
226
+
227
+
228
+ def get_available_queries(language: str) -> list[str]:
229
+ """
230
+ Get available queries for a specific language.
231
+
232
+ Args:
233
+ language: Programming language name
234
+
235
+ Returns:
236
+ List of available query names
237
+ """
238
+ try:
239
+ engine = get_engine()
240
+ # Try to get plugin and its supported queries
241
+ plugin = engine._get_language_plugin(language)
242
+ if plugin and hasattr(plugin, "get_supported_queries"):
243
+ return plugin.get_supported_queries()
244
+ else:
245
+ # Return default queries
246
+ return ["class", "method", "field"]
247
+ except Exception as e:
248
+ log_error(f"Failed to get available queries for {language}: {e}")
249
+ return []
250
+
251
+
252
+ def is_language_supported(language: str) -> bool:
253
+ """
254
+ Check if a programming language is supported.
255
+
256
+ Args:
257
+ language: Programming language name
258
+
259
+ Returns:
260
+ True if the language is supported
261
+ """
262
+ try:
263
+ supported_languages = get_supported_languages()
264
+ return language.lower() in [lang.lower() for lang in supported_languages]
265
+ except Exception as e:
266
+ log_error(f"Failed to check language support for {language}: {e}")
267
+ return False
268
+
269
+
270
+ def detect_language(file_path: str | Path) -> str | None:
271
+ """
272
+ Detect programming language from file path.
273
+
274
+ Args:
275
+ file_path: Path to the file
276
+
277
+ Returns:
278
+ Detected language name or None
279
+ """
280
+ try:
281
+ engine = get_engine()
282
+ # Use language_detector instead of language_registry
283
+ return engine.language_detector.detect_from_extension(str(file_path))
284
+ except Exception as e:
285
+ log_error(f"Failed to detect language for {file_path}: {e}")
286
+ return None
287
+
288
+
289
+ def get_file_extensions(language: str) -> list[str]:
290
+ """
291
+ Get file extensions for a specific language.
292
+
293
+ Args:
294
+ language: Programming language name
295
+
296
+ Returns:
297
+ List of file extensions
298
+ """
299
+ try:
300
+ engine = get_engine()
301
+ # Use language_detector to get extensions
302
+ if hasattr(engine.language_detector, "get_extensions_for_language"):
303
+ return engine.language_detector.get_extensions_for_language(language)
304
+ else:
305
+ # Fallback: return common extensions
306
+ extension_map = {
307
+ "java": [".java"],
308
+ "python": [".py"],
309
+ "javascript": [".js"],
310
+ "typescript": [".ts"],
311
+ "c": [".c"],
312
+ "cpp": [".cpp", ".cxx", ".cc"],
313
+ "go": [".go"],
314
+ "rust": [".rs"],
315
+ }
316
+ return extension_map.get(language.lower(), [])
317
+ except Exception as e:
318
+ log_error(f"Failed to get extensions for {language}: {e}")
319
+ return []
320
+
321
+
322
+ def validate_file(file_path: str | Path) -> dict[str, Any]:
323
+ """
324
+ Validate a source code file without full analysis.
325
+
326
+ Args:
327
+ file_path: Path to the file to validate
328
+
329
+ Returns:
330
+ Validation results dictionary
331
+ """
332
+ file_path = Path(file_path)
333
+
334
+ result: dict[str, Any] = {
335
+ "valid": False,
336
+ "exists": file_path.exists(),
337
+ "readable": False,
338
+ "language": None,
339
+ "supported": False,
340
+ "size": 0,
341
+ "errors": [],
342
+ }
343
+
344
+ try:
345
+ # Check if file exists
346
+ if not file_path.exists():
347
+ result["errors"].append("File does not exist")
348
+ return result
349
+
350
+ # Check if file is readable
351
+ try:
352
+ with open(file_path, encoding="utf-8") as f:
353
+ f.read(100) # Read first 100 chars to test
354
+ result["readable"] = True
355
+ result["size"] = file_path.stat().st_size
356
+ except Exception as e:
357
+ result["errors"].append(f"File is not readable: {e}")
358
+ return result
359
+
360
+ # Detect language
361
+ language = detect_language(file_path)
362
+ result["language"] = language
363
+
364
+ if language:
365
+ result["supported"] = is_language_supported(language)
366
+ if not result["supported"]:
367
+ result["errors"].append(f"Language '{language}' is not supported")
368
+ else:
369
+ result["errors"].append("Could not detect programming language")
370
+
371
+ # If we got this far with no errors, the file is valid
372
+ result["valid"] = len(result["errors"]) == 0
373
+
374
+ except Exception as e:
375
+ result["errors"].append(f"Validation failed: {e}")
376
+
377
+ return result
378
+
379
+
380
def get_framework_info() -> dict[str, Any]:
    """
    Get information about the framework and its capabilities.

    Returns:
        Framework information dictionary. On success it holds the name,
        version, supported languages and their count, plugin manager
        details and the list of core component names. On failure it holds
        only the name, version and an ``error`` message.
    """
    try:
        engine = get_engine()

        # Query the engine once so the list and its count always agree
        supported_languages = engine.get_supported_languages()
        plugin_manager = engine.plugin_manager

        return {
            "name": "tree-sitter-analyzer",
            # NOTE(review): hard-coded literal; confirm whether it should
            # track the package version instead.
            "version": "2.0.0",  # New architecture version
            "supported_languages": supported_languages,
            "total_languages": len(supported_languages),
            "plugin_info": {
                "manager_available": plugin_manager is not None,
                "loaded_plugins": (
                    len(plugin_manager.get_supported_languages())
                    if plugin_manager
                    else 0
                ),
            },
            "core_components": [
                "AnalysisEngine",
                "Parser",
                "QueryExecutor",
                "PluginManager",
                "LanguageDetector",
            ],
        }
    except Exception as e:
        log_error(f"Failed to get framework info: {e}")
        return {"name": "tree-sitter-analyzer", "version": "2.0.0", "error": str(e)}
414
+
415
+
416
def execute_query(
    file_path: str | Path, query_name: str, language: str | None = None
) -> dict[str, Any]:
    """
    Run a single named query against a file.

    The work is delegated to ``analyze_file`` with element extraction
    switched off and only ``query_name`` requested.

    Args:
        file_path: Path to the source file
        query_name: Name of the query to execute
        language: Programming language (auto-detected if not specified)

    Returns:
        Query execution results. ``success`` is always present; a successful
        run adds ``results``, ``count`` and ``language``, a failed run adds
        ``error``.
    """
    try:
        analysis = analyze_file(
            file_path,
            language=language,
            queries=[query_name],
            include_elements=False,
            include_queries=True,
        )

        # Analysis failed or produced no query section: report the error
        if not (analysis["success"] and "query_results" in analysis):
            return {
                "success": False,
                "query_name": query_name,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        matches = analysis["query_results"].get(query_name, [])
        return {
            "success": True,
            "query_name": query_name,
            "results": matches,
            "count": len(matches),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as e:
        log_error(f"Query execution failed: {e}")
        return {
            "success": False,
            "query_name": query_name,
            "error": str(e),
            "file_path": str(file_path),
        }
466
+
467
+
468
def extract_elements(
    file_path: str | Path,
    language: str | None = None,
    element_types: list[str] | None = None,
) -> dict[str, Any]:
    """
    Extract code elements from a file, optionally filtered by type.

    The work is delegated to ``analyze_file`` with query execution switched
    off. An element is kept when any requested type occurs, ignoring case,
    as a substring of the element's ``type`` value.

    Args:
        file_path: Path to the source file
        language: Programming language (auto-detected if not specified)
        element_types: Types of elements to extract (all if not specified)

    Returns:
        Element extraction results. ``success`` is always present; a
        successful run adds ``elements``, ``count`` and ``language``, a
        failed run adds ``error``.
    """
    try:
        analysis = analyze_file(
            file_path, language=language, include_elements=True, include_queries=False
        )

        # Analysis failed or produced no element section: report the error
        if not (analysis["success"] and "elements" in analysis):
            return {
                "success": False,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        found = analysis["elements"]

        # Keep only the requested element types, when any were given
        if element_types:
            found = [
                item
                for item in found
                if any(
                    wanted.lower() in item.get("type", "").lower()
                    for wanted in element_types
                )
            ]

        return {
            "success": True,
            "elements": found,
            "count": len(found),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as e:
        log_error(f"Element extraction failed: {e}")
        return {"success": False, "error": str(e), "file_path": str(file_path)}
521
+
522
+
523
+ # Convenience functions for backward compatibility
524
def analyze(file_path: str | Path, **kwargs: Any) -> dict[str, Any]:
    """
    Backward-compatible alias for ``analyze_file``.

    Args:
        file_path: Path to the source file
        **kwargs: Forwarded unchanged to ``analyze_file``

    Returns:
        Whatever ``analyze_file`` returns for the same arguments
    """
    analysis = analyze_file(file_path, **kwargs)
    return analysis
527
+
528
+
529
def get_languages() -> list[str]:
    """
    Backward-compatible alias for ``get_supported_languages``.

    Returns:
        Whatever ``get_supported_languages`` returns
    """
    languages = get_supported_languages()
    return languages