tree_sitter_analyzer-0.2.0-py3-none-any.whl → tree_sitter_analyzer-0.4.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of tree-sitter-analyzer might be problematic. Click here for more details.

Files changed (78)
  1. tree_sitter_analyzer/__init__.py +134 -121
  2. tree_sitter_analyzer/__main__.py +11 -12
  3. tree_sitter_analyzer/api.py +533 -539
  4. tree_sitter_analyzer/cli/__init__.py +39 -39
  5. tree_sitter_analyzer/cli/__main__.py +12 -13
  6. tree_sitter_analyzer/cli/commands/__init__.py +26 -27
  7. tree_sitter_analyzer/cli/commands/advanced_command.py +88 -88
  8. tree_sitter_analyzer/cli/commands/base_command.py +160 -155
  9. tree_sitter_analyzer/cli/commands/default_command.py +18 -19
  10. tree_sitter_analyzer/cli/commands/partial_read_command.py +141 -133
  11. tree_sitter_analyzer/cli/commands/query_command.py +81 -82
  12. tree_sitter_analyzer/cli/commands/structure_command.py +138 -121
  13. tree_sitter_analyzer/cli/commands/summary_command.py +101 -93
  14. tree_sitter_analyzer/cli/commands/table_command.py +235 -233
  15. tree_sitter_analyzer/cli/info_commands.py +120 -121
  16. tree_sitter_analyzer/cli_main.py +278 -276
  17. tree_sitter_analyzer/core/__init__.py +15 -20
  18. tree_sitter_analyzer/core/analysis_engine.py +555 -574
  19. tree_sitter_analyzer/core/cache_service.py +320 -330
  20. tree_sitter_analyzer/core/engine.py +559 -560
  21. tree_sitter_analyzer/core/parser.py +293 -288
  22. tree_sitter_analyzer/core/query.py +502 -502
  23. tree_sitter_analyzer/encoding_utils.py +456 -460
  24. tree_sitter_analyzer/exceptions.py +337 -340
  25. tree_sitter_analyzer/file_handler.py +210 -222
  26. tree_sitter_analyzer/formatters/__init__.py +1 -1
  27. tree_sitter_analyzer/formatters/base_formatter.py +167 -168
  28. tree_sitter_analyzer/formatters/formatter_factory.py +78 -74
  29. tree_sitter_analyzer/formatters/java_formatter.py +291 -270
  30. tree_sitter_analyzer/formatters/python_formatter.py +259 -235
  31. tree_sitter_analyzer/interfaces/__init__.py +9 -10
  32. tree_sitter_analyzer/interfaces/cli.py +528 -557
  33. tree_sitter_analyzer/interfaces/cli_adapter.py +343 -319
  34. tree_sitter_analyzer/interfaces/mcp_adapter.py +206 -170
  35. tree_sitter_analyzer/interfaces/mcp_server.py +405 -416
  36. tree_sitter_analyzer/java_analyzer.py +187 -219
  37. tree_sitter_analyzer/language_detector.py +398 -400
  38. tree_sitter_analyzer/language_loader.py +224 -228
  39. tree_sitter_analyzer/languages/__init__.py +10 -11
  40. tree_sitter_analyzer/languages/java_plugin.py +1174 -1113
  41. tree_sitter_analyzer/{plugins → languages}/javascript_plugin.py +446 -439
  42. tree_sitter_analyzer/languages/python_plugin.py +747 -712
  43. tree_sitter_analyzer/mcp/__init__.py +31 -32
  44. tree_sitter_analyzer/mcp/resources/__init__.py +44 -47
  45. tree_sitter_analyzer/mcp/resources/code_file_resource.py +209 -213
  46. tree_sitter_analyzer/mcp/resources/project_stats_resource.py +555 -550
  47. tree_sitter_analyzer/mcp/server.py +333 -345
  48. tree_sitter_analyzer/mcp/tools/__init__.py +30 -31
  49. tree_sitter_analyzer/mcp/tools/analyze_scale_tool.py +654 -557
  50. tree_sitter_analyzer/mcp/tools/analyze_scale_tool_cli_compatible.py +247 -245
  51. tree_sitter_analyzer/mcp/tools/base_tool.py +54 -55
  52. tree_sitter_analyzer/mcp/tools/read_partial_tool.py +300 -302
  53. tree_sitter_analyzer/mcp/tools/table_format_tool.py +362 -359
  54. tree_sitter_analyzer/mcp/tools/universal_analyze_tool.py +543 -476
  55. tree_sitter_analyzer/mcp/utils/__init__.py +107 -106
  56. tree_sitter_analyzer/mcp/utils/error_handler.py +549 -549
  57. tree_sitter_analyzer/models.py +470 -481
  58. tree_sitter_analyzer/output_manager.py +255 -264
  59. tree_sitter_analyzer/plugins/__init__.py +280 -334
  60. tree_sitter_analyzer/plugins/base.py +496 -446
  61. tree_sitter_analyzer/plugins/manager.py +379 -355
  62. tree_sitter_analyzer/queries/__init__.py +26 -27
  63. tree_sitter_analyzer/queries/java.py +391 -394
  64. tree_sitter_analyzer/queries/javascript.py +148 -149
  65. tree_sitter_analyzer/queries/python.py +285 -286
  66. tree_sitter_analyzer/queries/typescript.py +229 -230
  67. tree_sitter_analyzer/query_loader.py +257 -260
  68. tree_sitter_analyzer/table_formatter.py +471 -448
  69. tree_sitter_analyzer/utils.py +277 -277
  70. {tree_sitter_analyzer-0.2.0.dist-info → tree_sitter_analyzer-0.4.0.dist-info}/METADATA +23 -8
  71. tree_sitter_analyzer-0.4.0.dist-info/RECORD +73 -0
  72. {tree_sitter_analyzer-0.2.0.dist-info → tree_sitter_analyzer-0.4.0.dist-info}/entry_points.txt +2 -1
  73. tree_sitter_analyzer/plugins/java_plugin.py +0 -625
  74. tree_sitter_analyzer/plugins/plugin_loader.py +0 -83
  75. tree_sitter_analyzer/plugins/python_plugin.py +0 -598
  76. tree_sitter_analyzer/plugins/registry.py +0 -366
  77. tree_sitter_analyzer-0.2.0.dist-info/RECORD +0 -77
  78. {tree_sitter_analyzer-0.2.0.dist-info → tree_sitter_analyzer-0.4.0.dist-info}/WHEEL +0 -0
@@ -1,539 +1,533 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- Tree-sitter Analyzer API
5
-
6
- Public API facade that provides a stable, high-level interface to the
7
- tree-sitter analyzer framework. This is the main entry point for both
8
- CLI and MCP interfaces.
9
- """
10
-
11
- from pathlib import Path
12
- from typing import Any, Dict, List, Optional, Union
13
- import logging
14
-
15
- from .core.engine import AnalysisEngine
16
- from .utils import log_error, log_info, log_warning
17
-
18
- logger = logging.getLogger(__name__)
19
-
20
- # Global engine instance (singleton pattern)
21
- _engine: Optional[AnalysisEngine] = None
22
-
23
-
24
- def get_engine() -> AnalysisEngine:
25
- """
26
- Get the global analysis engine instance.
27
-
28
- Returns:
29
- AnalysisEngine instance
30
- """
31
- global _engine
32
- if _engine is None:
33
- _engine = AnalysisEngine()
34
- return _engine
35
-
36
-
37
- def analyze_file(
38
- file_path: Union[str, Path],
39
- language: Optional[str] = None,
40
- queries: Optional[List[str]] = None,
41
- include_elements: bool = True,
42
- include_details: bool = False, # Add for backward compatibility
43
- include_queries: bool = True,
44
- include_complexity: bool = False # Add for backward compatibility
45
- ) -> Dict[str, Any]:
46
- """
47
- Analyze a source code file.
48
-
49
- This is the main high-level function for file analysis. It handles
50
- language detection, parsing, query execution, and element extraction.
51
-
52
- Args:
53
- file_path: Path to the source file to analyze
54
- language: Programming language (auto-detected if not specified)
55
- queries: List of query names to execute (all available if not specified)
56
- include_elements: Whether to extract code elements
57
- include_queries: Whether to execute queries
58
- include_complexity: Whether to include complexity metrics (backward compatibility)
59
-
60
- Returns:
61
- Analysis results dictionary containing:
62
- - success: Whether the analysis was successful
63
- - file_info: Basic file information
64
- - language_info: Detected/specified language information
65
- - ast_info: Abstract syntax tree information
66
- - query_results: Results from executed queries (if include_queries=True)
67
- - elements: Extracted code elements (if include_elements=True)
68
- - error: Error message (if success=False)
69
- """
70
- try:
71
- engine = get_engine()
72
-
73
- # Perform the analysis
74
- analysis_result = engine.analyze_file(file_path, language)
75
-
76
- # Convert AnalysisResult to expected API format
77
- result = {
78
- "success": analysis_result.success,
79
- "file_info": {
80
- "path": str(file_path),
81
- "exists": Path(file_path).exists(),
82
- "size": Path(file_path).stat().st_size if Path(file_path).exists() else 0
83
- },
84
- "language_info": {
85
- "language": analysis_result.language,
86
- "detected": language is None # True if language was auto-detected
87
- },
88
- "ast_info": {
89
- "node_count": analysis_result.node_count,
90
- "line_count": analysis_result.line_count
91
- }
92
- }
93
-
94
- # Add elements if requested and available
95
- if include_elements and hasattr(analysis_result, 'elements'):
96
- result["elements"] = [
97
- {
98
- "name": elem.name,
99
- "type": type(elem).__name__.lower(),
100
- "start_line": elem.start_line,
101
- "end_line": elem.end_line,
102
- "raw_text": elem.raw_text,
103
- "language": elem.language
104
- }
105
- for elem in analysis_result.elements
106
- ]
107
-
108
- # Add query results if requested and available
109
- if include_queries and hasattr(analysis_result, 'query_results'):
110
- result["query_results"] = analysis_result.query_results
111
-
112
- # Add error message if analysis failed
113
- if not analysis_result.success and analysis_result.error_message:
114
- result["error"] = analysis_result.error_message
115
-
116
- # Filter results based on options
117
- if not include_elements and "elements" in result:
118
- del result["elements"]
119
-
120
- if not include_queries and "query_results" in result:
121
- del result["query_results"]
122
-
123
- return result
124
-
125
- except FileNotFoundError as e:
126
- # Re-raise FileNotFoundError for tests that expect it
127
- raise e
128
- except Exception as e:
129
- log_error(f"API analyze_file failed: {e}")
130
- return {
131
- "success": False,
132
- "error": str(e),
133
- "file_info": {"path": str(file_path), "exists": Path(file_path).exists()}
134
- }
135
-
136
-
137
- def analyze_code(
138
- source_code: str,
139
- language: str,
140
- queries: Optional[List[str]] = None,
141
- include_elements: bool = True,
142
- include_queries: bool = True
143
- ) -> Dict[str, Any]:
144
- """
145
- Analyze source code directly (without file).
146
-
147
- Args:
148
- source_code: Source code string to analyze
149
- language: Programming language
150
- queries: List of query names to execute (all available if not specified)
151
- include_elements: Whether to extract code elements
152
- include_queries: Whether to execute queries
153
-
154
- Returns:
155
- Analysis results dictionary
156
- """
157
- try:
158
- engine = get_engine()
159
-
160
- # Perform the analysis
161
- analysis_result = engine.analyze_code(source_code, language)
162
-
163
- # Convert AnalysisResult to expected API format
164
- result = {
165
- "success": analysis_result.success,
166
- "language_info": {
167
- "language": analysis_result.language,
168
- "detected": False # Language was explicitly provided
169
- },
170
- "ast_info": {
171
- "node_count": analysis_result.node_count,
172
- "line_count": analysis_result.line_count
173
- }
174
- }
175
-
176
- # Add elements if requested and available
177
- if include_elements and hasattr(analysis_result, 'elements'):
178
- result["elements"] = [
179
- {
180
- "name": elem.name,
181
- "type": type(elem).__name__.lower(),
182
- "start_line": elem.start_line,
183
- "end_line": elem.end_line,
184
- "raw_text": elem.raw_text,
185
- "language": elem.language
186
- }
187
- for elem in analysis_result.elements
188
- ]
189
-
190
- # Add query results if requested and available
191
- if include_queries and hasattr(analysis_result, 'query_results'):
192
- result["query_results"] = analysis_result.query_results
193
-
194
- # Add error message if analysis failed
195
- if not analysis_result.success and analysis_result.error_message:
196
- result["error"] = analysis_result.error_message
197
-
198
- # Filter results based on options
199
- if not include_elements and "elements" in result:
200
- del result["elements"]
201
-
202
- if not include_queries and "query_results" in result:
203
- del result["query_results"]
204
-
205
- return result
206
-
207
- except Exception as e:
208
- log_error(f"API analyze_code failed: {e}")
209
- return {
210
- "success": False,
211
- "error": str(e)
212
- }
213
-
214
-
215
- def get_supported_languages() -> List[str]:
216
- """
217
- Get list of all supported programming languages.
218
-
219
- Returns:
220
- List of supported language names
221
- """
222
- try:
223
- engine = get_engine()
224
- return engine.get_supported_languages()
225
- except Exception as e:
226
- log_error(f"Failed to get supported languages: {e}")
227
- return []
228
-
229
-
230
- def get_available_queries(language: str) -> List[str]:
231
- """
232
- Get available queries for a specific language.
233
-
234
- Args:
235
- language: Programming language name
236
-
237
- Returns:
238
- List of available query names
239
- """
240
- try:
241
- engine = get_engine()
242
- # Try to get plugin and its supported queries
243
- plugin = engine._get_language_plugin(language)
244
- if plugin and hasattr(plugin, 'get_supported_queries'):
245
- return plugin.get_supported_queries()
246
- else:
247
- # Return default queries
248
- return ['class', 'method', 'field']
249
- except Exception as e:
250
- log_error(f"Failed to get available queries for {language}: {e}")
251
- return []
252
-
253
-
254
- def is_language_supported(language: str) -> bool:
255
- """
256
- Check if a programming language is supported.
257
-
258
- Args:
259
- language: Programming language name
260
-
261
- Returns:
262
- True if the language is supported
263
- """
264
- try:
265
- supported_languages = get_supported_languages()
266
- return language.lower() in [lang.lower() for lang in supported_languages]
267
- except Exception as e:
268
- log_error(f"Failed to check language support for {language}: {e}")
269
- return False
270
-
271
-
272
- def detect_language(file_path: Union[str, Path]) -> Optional[str]:
273
- """
274
- Detect programming language from file path.
275
-
276
- Args:
277
- file_path: Path to the file
278
-
279
- Returns:
280
- Detected language name or None
281
- """
282
- try:
283
- engine = get_engine()
284
- # Use language_detector instead of language_registry
285
- return engine.language_detector.detect_from_extension(str(file_path))
286
- except Exception as e:
287
- log_error(f"Failed to detect language for {file_path}: {e}")
288
- return None
289
-
290
-
291
- def get_file_extensions(language: str) -> List[str]:
292
- """
293
- Get file extensions for a specific language.
294
-
295
- Args:
296
- language: Programming language name
297
-
298
- Returns:
299
- List of file extensions
300
- """
301
- try:
302
- engine = get_engine()
303
- # Use language_detector to get extensions
304
- if hasattr(engine.language_detector, 'get_extensions_for_language'):
305
- return engine.language_detector.get_extensions_for_language(language)
306
- else:
307
- # Fallback: return common extensions
308
- extension_map = {
309
- 'java': ['.java'],
310
- 'python': ['.py'],
311
- 'javascript': ['.js'],
312
- 'typescript': ['.ts'],
313
- 'c': ['.c'],
314
- 'cpp': ['.cpp', '.cxx', '.cc'],
315
- 'go': ['.go'],
316
- 'rust': ['.rs']
317
- }
318
- return extension_map.get(language.lower(), [])
319
- except Exception as e:
320
- log_error(f"Failed to get extensions for {language}: {e}")
321
- return []
322
-
323
-
324
- def validate_file(file_path: Union[str, Path]) -> Dict[str, Any]:
325
- """
326
- Validate a source code file without full analysis.
327
-
328
- Args:
329
- file_path: Path to the file to validate
330
-
331
- Returns:
332
- Validation results dictionary
333
- """
334
- file_path = Path(file_path)
335
-
336
- result = {
337
- "valid": False,
338
- "exists": file_path.exists(),
339
- "readable": False,
340
- "language": None,
341
- "supported": False,
342
- "size": 0,
343
- "errors": []
344
- }
345
-
346
- try:
347
- # Check if file exists
348
- if not file_path.exists():
349
- result["errors"].append("File does not exist")
350
- return result
351
-
352
- # Check if file is readable
353
- try:
354
- with open(file_path, 'r', encoding='utf-8') as f:
355
- content = f.read(100) # Read first 100 chars to test
356
- result["readable"] = True
357
- result["size"] = file_path.stat().st_size
358
- except Exception as e:
359
- result["errors"].append(f"File is not readable: {e}")
360
- return result
361
-
362
- # Detect language
363
- language = detect_language(file_path)
364
- result["language"] = language
365
-
366
- if language:
367
- result["supported"] = is_language_supported(language)
368
- if not result["supported"]:
369
- result["errors"].append(f"Language '{language}' is not supported")
370
- else:
371
- result["errors"].append("Could not detect programming language")
372
-
373
- # If we got this far with no errors, the file is valid
374
- result["valid"] = len(result["errors"]) == 0
375
-
376
- except Exception as e:
377
- result["errors"].append(f"Validation failed: {e}")
378
-
379
- return result
380
-
381
-
382
- def get_framework_info() -> Dict[str, Any]:
383
- """
384
- Get information about the framework and its capabilities.
385
-
386
- Returns:
387
- Framework information dictionary
388
- """
389
- try:
390
- engine = get_engine()
391
-
392
- return {
393
- "name": "tree-sitter-analyzer",
394
- "version": "2.0.0", # New architecture version
395
- "supported_languages": engine.get_supported_languages(),
396
- "total_languages": len(engine.get_supported_languages()),
397
- "plugin_info": {
398
- "manager_available": engine.plugin_manager is not None,
399
- "loaded_plugins": len(engine.plugin_manager.get_supported_languages()) if engine.plugin_manager else 0
400
- },
401
- "core_components": [
402
- "AnalysisEngine",
403
- "Parser",
404
- "QueryExecutor",
405
- "PluginManager",
406
- "LanguageDetector"
407
- ]
408
- }
409
- except Exception as e:
410
- log_error(f"Failed to get framework info: {e}")
411
- return {
412
- "name": "tree-sitter-analyzer",
413
- "version": "2.0.0",
414
- "error": str(e)
415
- }
416
-
417
-
418
- def execute_query(
419
- file_path: Union[str, Path],
420
- query_name: str,
421
- language: Optional[str] = None
422
- ) -> Dict[str, Any]:
423
- """
424
- Execute a specific query against a file.
425
-
426
- Args:
427
- file_path: Path to the source file
428
- query_name: Name of the query to execute
429
- language: Programming language (auto-detected if not specified)
430
-
431
- Returns:
432
- Query execution results
433
- """
434
- try:
435
- # Analyze with only the specified query
436
- result = analyze_file(
437
- file_path,
438
- language=language,
439
- queries=[query_name],
440
- include_elements=False,
441
- include_queries=True
442
- )
443
-
444
- if result["success"] and "query_results" in result:
445
- query_results = result["query_results"].get(query_name, [])
446
- return {
447
- "success": True,
448
- "query_name": query_name,
449
- "results": query_results,
450
- "count": len(query_results),
451
- "language": result.get("language_info", {}).get("language"),
452
- "file_path": str(file_path)
453
- }
454
- else:
455
- return {
456
- "success": False,
457
- "query_name": query_name,
458
- "error": result.get("error", "Unknown error"),
459
- "file_path": str(file_path)
460
- }
461
-
462
- except Exception as e:
463
- log_error(f"Query execution failed: {e}")
464
- return {
465
- "success": False,
466
- "query_name": query_name,
467
- "error": str(e),
468
- "file_path": str(file_path)
469
- }
470
-
471
-
472
- def extract_elements(
473
- file_path: Union[str, Path],
474
- language: Optional[str] = None,
475
- element_types: Optional[List[str]] = None
476
- ) -> Dict[str, Any]:
477
- """
478
- Extract code elements from a file.
479
-
480
- Args:
481
- file_path: Path to the source file
482
- language: Programming language (auto-detected if not specified)
483
- element_types: Types of elements to extract (all if not specified)
484
-
485
- Returns:
486
- Element extraction results
487
- """
488
- try:
489
- # Analyze with only element extraction
490
- result = analyze_file(
491
- file_path,
492
- language=language,
493
- include_elements=True,
494
- include_queries=False
495
- )
496
-
497
- if result["success"] and "elements" in result:
498
- elements = result["elements"]
499
-
500
- # Filter by element types if specified
501
- if element_types:
502
- filtered_elements = []
503
- for element in elements:
504
- if any(etype.lower() in element.get("type", "").lower() for etype in element_types):
505
- filtered_elements.append(element)
506
- elements = filtered_elements
507
-
508
- return {
509
- "success": True,
510
- "elements": elements,
511
- "count": len(elements),
512
- "language": result.get("language_info", {}).get("language"),
513
- "file_path": str(file_path)
514
- }
515
- else:
516
- return {
517
- "success": False,
518
- "error": result.get("error", "Unknown error"),
519
- "file_path": str(file_path)
520
- }
521
-
522
- except Exception as e:
523
- log_error(f"Element extraction failed: {e}")
524
- return {
525
- "success": False,
526
- "error": str(e),
527
- "file_path": str(file_path)
528
- }
529
-
530
-
531
- # Convenience functions for backward compatibility
532
- def analyze(file_path: Union[str, Path], **kwargs) -> Dict[str, Any]:
533
- """Convenience function that aliases to analyze_file."""
534
- return analyze_file(file_path, **kwargs)
535
-
536
-
537
- def get_languages() -> List[str]:
538
- """Convenience function that aliases to get_supported_languages."""
539
- return get_supported_languages()
1
+ #!/usr/bin/env python3
2
+ """
3
+ Tree-sitter Analyzer API
4
+
5
+ Public API facade that provides a stable, high-level interface to the
6
+ tree-sitter analyzer framework. This is the main entry point for both
7
+ CLI and MCP interfaces.
8
+ """
9
+
10
+ import logging
11
+ from pathlib import Path
12
+ from typing import Any
13
+
14
+ from .core.engine import AnalysisEngine
15
+ from .utils import log_error
16
+
17
+ logger = logging.getLogger(__name__)
18
+
19
+ # Global engine instance (singleton pattern)
20
+ _engine: AnalysisEngine | None = None
21
+
22
+
23
+ def get_engine() -> AnalysisEngine:
24
+ """
25
+ Get the global analysis engine instance.
26
+
27
+ Returns:
28
+ AnalysisEngine instance
29
+ """
30
+ global _engine
31
+ if _engine is None:
32
+ _engine = AnalysisEngine()
33
+ return _engine
34
+
35
+
36
+ def analyze_file(
37
+ file_path: str | Path,
38
+ language: str | None = None,
39
+ queries: list[str] | None = None,
40
+ include_elements: bool = True,
41
+ include_details: bool = False, # Add for backward compatibility
42
+ include_queries: bool = True,
43
+ include_complexity: bool = False, # Add for backward compatibility
44
+ ) -> dict[str, Any]:
45
+ """
46
+ Analyze a source code file.
47
+
48
+ This is the main high-level function for file analysis. It handles
49
+ language detection, parsing, query execution, and element extraction.
50
+
51
+ Args:
52
+ file_path: Path to the source file to analyze
53
+ language: Programming language (auto-detected if not specified)
54
+ queries: List of query names to execute (all available if not specified)
55
+ include_elements: Whether to extract code elements
56
+ include_queries: Whether to execute queries
57
+ include_complexity: Whether to include complexity metrics (backward compatibility)
58
+
59
+ Returns:
60
+ Analysis results dictionary containing:
61
+ - success: Whether the analysis was successful
62
+ - file_info: Basic file information
63
+ - language_info: Detected/specified language information
64
+ - ast_info: Abstract syntax tree information
65
+ - query_results: Results from executed queries (if include_queries=True)
66
+ - elements: Extracted code elements (if include_elements=True)
67
+ - error: Error message (if success=False)
68
+ """
69
+ try:
70
+ engine = get_engine()
71
+
72
+ # Perform the analysis
73
+ analysis_result = engine.analyze_file(file_path, language)
74
+
75
+ # Convert AnalysisResult to expected API format
76
+ result = {
77
+ "success": analysis_result.success,
78
+ "file_info": {
79
+ "path": str(file_path),
80
+ "exists": Path(file_path).exists(),
81
+ "size": (
82
+ Path(file_path).stat().st_size if Path(file_path).exists() else 0
83
+ ),
84
+ },
85
+ "language_info": {
86
+ "language": analysis_result.language,
87
+ "detected": language is None, # True if language was auto-detected
88
+ },
89
+ "ast_info": {
90
+ "node_count": analysis_result.node_count,
91
+ "line_count": analysis_result.line_count,
92
+ },
93
+ }
94
+
95
+ # Add elements if requested and available
96
+ if include_elements and hasattr(analysis_result, "elements"):
97
+ result["elements"] = [
98
+ {
99
+ "name": elem.name,
100
+ "type": type(elem).__name__.lower(),
101
+ "start_line": elem.start_line,
102
+ "end_line": elem.end_line,
103
+ "raw_text": elem.raw_text,
104
+ "language": elem.language,
105
+ }
106
+ for elem in analysis_result.elements
107
+ ]
108
+
109
+ # Add query results if requested and available
110
+ if include_queries and hasattr(analysis_result, "query_results"):
111
+ result["query_results"] = analysis_result.query_results
112
+
113
+ # Add error message if analysis failed
114
+ if not analysis_result.success and analysis_result.error_message:
115
+ result["error"] = analysis_result.error_message
116
+
117
+ # Filter results based on options
118
+ if not include_elements and "elements" in result:
119
+ del result["elements"]
120
+
121
+ if not include_queries and "query_results" in result:
122
+ del result["query_results"]
123
+
124
+ return result
125
+
126
+ except FileNotFoundError as e:
127
+ # Re-raise FileNotFoundError for tests that expect it
128
+ raise e
129
+ except Exception as e:
130
+ log_error(f"API analyze_file failed: {e}")
131
+ return {
132
+ "success": False,
133
+ "error": str(e),
134
+ "file_info": {"path": str(file_path), "exists": Path(file_path).exists()},
135
+ }
136
+
137
+
138
+ def analyze_code(
139
+ source_code: str,
140
+ language: str,
141
+ queries: list[str] | None = None,
142
+ include_elements: bool = True,
143
+ include_queries: bool = True,
144
+ ) -> dict[str, Any]:
145
+ """
146
+ Analyze source code directly (without file).
147
+
148
+ Args:
149
+ source_code: Source code string to analyze
150
+ language: Programming language
151
+ queries: List of query names to execute (all available if not specified)
152
+ include_elements: Whether to extract code elements
153
+ include_queries: Whether to execute queries
154
+
155
+ Returns:
156
+ Analysis results dictionary
157
+ """
158
+ try:
159
+ engine = get_engine()
160
+
161
+ # Perform the analysis
162
+ analysis_result = engine.analyze_code(source_code, language)
163
+
164
+ # Convert AnalysisResult to expected API format
165
+ result = {
166
+ "success": analysis_result.success,
167
+ "language_info": {
168
+ "language": analysis_result.language,
169
+ "detected": False, # Language was explicitly provided
170
+ },
171
+ "ast_info": {
172
+ "node_count": analysis_result.node_count,
173
+ "line_count": analysis_result.line_count,
174
+ },
175
+ }
176
+
177
+ # Add elements if requested and available
178
+ if include_elements and hasattr(analysis_result, "elements"):
179
+ result["elements"] = [
180
+ {
181
+ "name": elem.name,
182
+ "type": type(elem).__name__.lower(),
183
+ "start_line": elem.start_line,
184
+ "end_line": elem.end_line,
185
+ "raw_text": elem.raw_text,
186
+ "language": elem.language,
187
+ }
188
+ for elem in analysis_result.elements
189
+ ]
190
+
191
+ # Add query results if requested and available
192
+ if include_queries and hasattr(analysis_result, "query_results"):
193
+ result["query_results"] = analysis_result.query_results
194
+
195
+ # Add error message if analysis failed
196
+ if not analysis_result.success and analysis_result.error_message:
197
+ result["error"] = analysis_result.error_message
198
+
199
+ # Filter results based on options
200
+ if not include_elements and "elements" in result:
201
+ del result["elements"]
202
+
203
+ if not include_queries and "query_results" in result:
204
+ del result["query_results"]
205
+
206
+ return result
207
+
208
+ except Exception as e:
209
+ log_error(f"API analyze_code failed: {e}")
210
+ return {"success": False, "error": str(e)}
211
+
212
+
213
+ def get_supported_languages() -> list[str]:
214
+ """
215
+ Get list of all supported programming languages.
216
+
217
+ Returns:
218
+ List of supported language names
219
+ """
220
+ try:
221
+ engine = get_engine()
222
+ return engine.get_supported_languages()
223
+ except Exception as e:
224
+ log_error(f"Failed to get supported languages: {e}")
225
+ return []
226
+
227
+
228
+ def get_available_queries(language: str) -> list[str]:
229
+ """
230
+ Get available queries for a specific language.
231
+
232
+ Args:
233
+ language: Programming language name
234
+
235
+ Returns:
236
+ List of available query names
237
+ """
238
+ try:
239
+ engine = get_engine()
240
+ # Try to get plugin and its supported queries
241
+ plugin = engine._get_language_plugin(language)
242
+ if plugin and hasattr(plugin, "get_supported_queries"):
243
+ result = plugin.get_supported_queries()
244
+ return list(result) if result else []
245
+ else:
246
+ # Return default queries
247
+ return ["class", "method", "field"]
248
+ except Exception as e:
249
+ log_error(f"Failed to get available queries for {language}: {e}")
250
+ return []
251
+
252
+
253
+ def is_language_supported(language: str) -> bool:
254
+ """
255
+ Check if a programming language is supported.
256
+
257
+ Args:
258
+ language: Programming language name
259
+
260
+ Returns:
261
+ True if the language is supported
262
+ """
263
+ try:
264
+ supported_languages = get_supported_languages()
265
+ return language.lower() in [lang.lower() for lang in supported_languages]
266
+ except Exception as e:
267
+ log_error(f"Failed to check language support for {language}: {e}")
268
+ return False
269
+
270
+
271
+ def detect_language(file_path: str | Path) -> str | None:
272
+ """
273
+ Detect programming language from file path.
274
+
275
+ Args:
276
+ file_path: Path to the file
277
+
278
+ Returns:
279
+ Detected language name or None
280
+ """
281
+ try:
282
+ engine = get_engine()
283
+ # Use language_detector instead of language_registry
284
+ return engine.language_detector.detect_from_extension(str(file_path))
285
+ except Exception as e:
286
+ log_error(f"Failed to detect language for {file_path}: {e}")
287
+ return None
288
+
289
+
290
+ def get_file_extensions(language: str) -> list[str]:
291
+ """
292
+ Get file extensions for a specific language.
293
+
294
+ Args:
295
+ language: Programming language name
296
+
297
+ Returns:
298
+ List of file extensions
299
+ """
300
+ try:
301
+ engine = get_engine()
302
+ # Use language_detector to get extensions
303
+ if hasattr(engine.language_detector, "get_extensions_for_language"):
304
+ result = engine.language_detector.get_extensions_for_language(language)
305
+ return list(result) if result else []
306
+ else:
307
+ # Fallback: return common extensions
308
+ extension_map = {
309
+ "java": [".java"],
310
+ "python": [".py"],
311
+ "javascript": [".js"],
312
+ "typescript": [".ts"],
313
+ "c": [".c"],
314
+ "cpp": [".cpp", ".cxx", ".cc"],
315
+ "go": [".go"],
316
+ "rust": [".rs"],
317
+ }
318
+ return extension_map.get(language.lower(), [])
319
+ except Exception as e:
320
+ log_error(f"Failed to get extensions for {language}: {e}")
321
+ return []
322
+
323
+
324
+ def validate_file(file_path: str | Path) -> dict[str, Any]:
325
+ """
326
+ Validate a source code file without full analysis.
327
+
328
+ Args:
329
+ file_path: Path to the file to validate
330
+
331
+ Returns:
332
+ Validation results dictionary
333
+ """
334
+ file_path = Path(file_path)
335
+
336
+ result: dict[str, Any] = {
337
+ "valid": False,
338
+ "exists": file_path.exists(),
339
+ "readable": False,
340
+ "language": None,
341
+ "supported": False,
342
+ "size": 0,
343
+ "errors": [],
344
+ }
345
+
346
+ try:
347
+ # Check if file exists
348
+ if not file_path.exists():
349
+ result["errors"].append("File does not exist")
350
+ return result
351
+
352
+ # Check if file is readable
353
+ try:
354
+ with open(file_path, encoding="utf-8") as f:
355
+ f.read(100) # Read first 100 chars to test
356
+ result["readable"] = True
357
+ result["size"] = file_path.stat().st_size
358
+ except Exception as e:
359
+ result["errors"].append(f"File is not readable: {e}")
360
+ return result
361
+
362
+ # Detect language
363
+ language = detect_language(file_path)
364
+ result["language"] = language
365
+
366
+ if language:
367
+ result["supported"] = is_language_supported(language)
368
+ if not result["supported"]:
369
+ result["errors"].append(f"Language '{language}' is not supported")
370
+ else:
371
+ result["errors"].append("Could not detect programming language")
372
+
373
+ # If we got this far with no errors, the file is valid
374
+ result["valid"] = len(result["errors"]) == 0
375
+
376
+ except Exception as e:
377
+ result["errors"].append(f"Validation failed: {e}")
378
+
379
+ return result
380
+
381
+
382
def get_framework_info() -> dict[str, Any]:
    """
    Get information about the framework and its capabilities.

    Returns:
        Framework information dictionary with the keys ``name``,
        ``version``, ``supported_languages``, ``total_languages``,
        ``plugin_info`` and ``core_components``. If gathering the
        information fails, the error is logged and a reduced dictionary
        with ``name``, ``version`` and ``error`` is returned instead.
    """
    try:
        engine = get_engine()

        # Query the engine once so the reported list and its count are
        # always derived from the same result.
        supported_languages = engine.get_supported_languages()
        plugin_manager = engine.plugin_manager

        if plugin_manager:
            loaded_plugins = len(plugin_manager.get_supported_languages())
        else:
            loaded_plugins = 0

        return {
            "name": "tree-sitter-analyzer",
            # NOTE(review): hard-coded "new architecture" version string;
            # confirm whether it should track the package version.
            "version": "2.0.0",  # New architecture version
            "supported_languages": supported_languages,
            "total_languages": len(supported_languages),
            "plugin_info": {
                "manager_available": plugin_manager is not None,
                "loaded_plugins": loaded_plugins,
            },
            "core_components": [
                "AnalysisEngine",
                "Parser",
                "QueryExecutor",
                "PluginManager",
                "LanguageDetector",
            ],
        }
    except Exception as e:
        log_error(f"Failed to get framework info: {e}")
        return {"name": "tree-sitter-analyzer", "version": "2.0.0", "error": str(e)}
416
+
417
+
418
def execute_query(
    file_path: str | Path, query_name: str, language: str | None = None
) -> dict[str, Any]:
    """
    Run a single named query against a file.

    The work is delegated to ``analyze_file`` with element extraction
    disabled and only ``query_name`` requested.

    Args:
        file_path: Path to the source file
        query_name: Name of the query to execute
        language: Programming language, forwarded to ``analyze_file``
            (None when not specified)

    Returns:
        On success, a dictionary with ``success``, ``query_name``,
        ``results``, ``count``, ``language`` and ``file_path``. On failure,
        a dictionary with ``success`` set to False, ``query_name``,
        ``error`` and ``file_path``.
    """
    try:
        # Restrict the analysis to the one requested query.
        analysis = analyze_file(
            file_path,
            language=language,
            queries=[query_name],
            include_elements=False,
            include_queries=True,
        )

        succeeded = analysis["success"] and "query_results" in analysis
        if not succeeded:
            return {
                "success": False,
                "query_name": query_name,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        # A query with no recorded results yields an empty list.
        matches = analysis["query_results"].get(query_name, [])
        return {
            "success": True,
            "query_name": query_name,
            "results": matches,
            "count": len(matches),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as exc:
        log_error(f"Query execution failed: {exc}")
        return {
            "success": False,
            "query_name": query_name,
            "error": str(exc),
            "file_path": str(file_path),
        }
468
+
469
+
470
def extract_elements(
    file_path: str | Path,
    language: str | None = None,
    element_types: list[str] | None = None,
) -> dict[str, Any]:
    """
    Collect the code elements found in a file.

    The work is delegated to ``analyze_file`` with queries disabled. When
    ``element_types`` is given, an element is kept if any requested type
    is a case-insensitive substring of the element's ``type`` value.

    Args:
        file_path: Path to the source file
        language: Programming language, forwarded to ``analyze_file``
            (None when not specified)
        element_types: Types of elements to extract (all if not specified)

    Returns:
        On success, a dictionary with ``success``, ``elements``, ``count``,
        ``language`` and ``file_path``. On failure, a dictionary with
        ``success`` set to False, ``error`` and ``file_path``.
    """
    try:
        # Element extraction only; no queries are run.
        analysis = analyze_file(
            file_path, language=language, include_elements=True, include_queries=False
        )

        if not (analysis["success"] and "elements" in analysis):
            return {
                "success": False,
                "error": analysis.get("error", "Unknown error"),
                "file_path": str(file_path),
            }

        extracted = analysis["elements"]

        # Optional filtering by (partial, case-insensitive) type name.
        if element_types:
            extracted = [
                item
                for item in extracted
                if any(
                    wanted.lower() in item.get("type", "").lower()
                    for wanted in element_types
                )
            ]

        return {
            "success": True,
            "elements": extracted,
            "count": len(extracted),
            "language": analysis.get("language_info", {}).get("language"),
            "file_path": str(file_path),
        }

    except Exception as exc:
        log_error(f"Element extraction failed: {exc}")
        return {"success": False, "error": str(exc), "file_path": str(file_path)}
523
+
524
+
525
+ # Convenience functions for backward compatibility
526
def analyze(file_path: str | Path, **kwargs: Any) -> dict[str, Any]:
    """
    Backward-compatible alias for analyze_file.

    Args:
        file_path: Path to the source file
        **kwargs: Keyword arguments forwarded unchanged to analyze_file

    Returns:
        Whatever analyze_file returns for the same arguments
    """
    analysis = analyze_file(file_path, **kwargs)
    return analysis
529
+
530
+
531
def get_languages() -> list[str]:
    """
    Backward-compatible alias for get_supported_languages.

    Returns:
        Whatever get_supported_languages returns
    """
    languages = get_supported_languages()
    return languages