code2llm 0.3.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (49) hide show
  1. code2flow/__init__.py +47 -0
  2. code2flow/__main__.py +6 -0
  3. code2flow/analysis/__init__.py +23 -0
  4. code2flow/analysis/call_graph.py +210 -0
  5. code2flow/analysis/cfg.py +293 -0
  6. code2flow/analysis/coupling.py +77 -0
  7. code2flow/analysis/data_analysis.py +249 -0
  8. code2flow/analysis/dfg.py +224 -0
  9. code2flow/analysis/pipeline_detector.py +445 -0
  10. code2flow/analysis/side_effects.py +313 -0
  11. code2flow/analysis/smells.py +192 -0
  12. code2flow/analysis/type_inference.py +306 -0
  13. code2flow/cli.py +493 -0
  14. code2flow/core/__init__.py +36 -0
  15. code2flow/core/analyzer.py +765 -0
  16. code2flow/core/config.py +177 -0
  17. code2flow/core/models.py +194 -0
  18. code2flow/core/streaming_analyzer.py +666 -0
  19. code2flow/exporters/__init__.py +35 -0
  20. code2flow/exporters/base.py +13 -0
  21. code2flow/exporters/context_exporter.py +207 -0
  22. code2flow/exporters/flow_exporter.py +570 -0
  23. code2flow/exporters/json_exporter.py +17 -0
  24. code2flow/exporters/llm_exporter.py +12 -0
  25. code2flow/exporters/map_exporter.py +218 -0
  26. code2flow/exporters/mermaid_exporter.py +67 -0
  27. code2flow/exporters/toon.py +982 -0
  28. code2flow/exporters/yaml_exporter.py +108 -0
  29. code2flow/llm_flow_generator.py +451 -0
  30. code2flow/llm_task_generator.py +263 -0
  31. code2flow/mermaid_generator.py +481 -0
  32. code2flow/nlp/__init__.py +23 -0
  33. code2flow/nlp/config.py +174 -0
  34. code2flow/nlp/entity_resolution.py +326 -0
  35. code2flow/nlp/intent_matching.py +297 -0
  36. code2flow/nlp/normalization.py +122 -0
  37. code2flow/nlp/pipeline.py +388 -0
  38. code2flow/patterns/__init__.py +0 -0
  39. code2flow/patterns/detector.py +168 -0
  40. code2flow/refactor/__init__.py +0 -0
  41. code2flow/refactor/prompt_engine.py +150 -0
  42. code2flow/visualizers/__init__.py +0 -0
  43. code2flow/visualizers/graph.py +196 -0
  44. code2llm-0.3.7.dist-info/METADATA +604 -0
  45. code2llm-0.3.7.dist-info/RECORD +49 -0
  46. code2llm-0.3.7.dist-info/WHEEL +5 -0
  47. code2llm-0.3.7.dist-info/entry_points.txt +2 -0
  48. code2llm-0.3.7.dist-info/licenses/LICENSE +201 -0
  49. code2llm-0.3.7.dist-info/top_level.txt +1 -0
code2flow/cli.py ADDED
@@ -0,0 +1,493 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ code2flow - CLI for Python code flow analysis
4
+
5
+ Analyze control flow, data flow, and call graphs of Python codebases.
6
+ """
7
+
8
+ import argparse
9
+ import sys
10
+ from pathlib import Path
11
+
12
+ from .core.config import Config, ANALYSIS_MODES
13
+ from .core.analyzer import ProjectAnalyzer
14
+ from .exporters import (
15
+ YAMLExporter, JSONExporter, MermaidExporter,
16
+ ContextExporter, LLMPromptExporter,
17
+ ToonExporter, MapExporter, FlowExporter,
18
+ )
19
+ from .visualizers.graph import GraphVisualizer
20
+
21
+
22
def create_parser() -> argparse.ArgumentParser:
    """Create the CLI argument parser for the main ``code2flow`` command.

    Returns:
        argparse.ArgumentParser: Parser accepting an optional positional
        ``source`` path plus analysis, output-format, and refactoring flags.
    """
    parser = argparse.ArgumentParser(
        prog='code2flow',
        description='Analyze Python code control flow, data flow, and call graphs',
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog='''
Examples:
  code2flow /path/to/project                  # Default: TOON format only
  code2flow /path/to/project -f all           # Generate all formats
  code2flow /path/to/project -f toon,map,flow # Diagnostics + structure + data-flow
  code2flow /path/to/project -f context       # LLM narrative context
  code2flow /path/to/project -m static -o ./analysis
  code2flow llm-flow                          # Generate LLM flow summary

Format Options:
  toon    - Health diagnostics (analysis.toon) — default
  map     - Structural map (map.toon) — modules, imports, signatures
  flow    - Data-flow analysis (flow.toon) — pipelines, contracts, types
  context - LLM narrative (context.md) — architecture summary
  yaml    - Standard YAML format
  json    - Machine-readable JSON
  mermaid - Flowchart diagrams
  png     - Visual graphs
  all     - Generate all formats
'''
    )

    # Positional source argument is optional so that subcommand-style
    # invocations (llm-flow, llm-context) can be intercepted in main().
    parser.add_argument(
        'source',
        nargs='?',
        help='Path to Python source file or directory'
    )

    parser.add_argument(
        '-m', '--mode',
        choices=list(ANALYSIS_MODES.keys()),
        default='hybrid',
        # Plain string: the previous f-string had no placeholders.
        help='Analysis mode (default: hybrid)'
    )

    parser.add_argument(
        '-o', '--output',
        default='./code2flow_output',
        help='Output directory (default: ./code2flow_output)'
    )

    parser.add_argument(
        '-f', '--format',
        default='toon',
        help='Output formats: toon,map,flow,context,yaml,json,mermaid,png,all (default: toon)'
    )

    parser.add_argument(
        '--full',
        action='store_true',
        help='Include all fields in output (including empty/null values)'
    )

    parser.add_argument(
        '--no-patterns',
        action='store_true',
        help='Disable pattern detection'
    )

    parser.add_argument(
        '--max-depth',
        type=int,
        default=10,
        help='Maximum analysis depth (default: 10)'
    )

    parser.add_argument(
        '-v', '--verbose',
        action='store_true',
        help='Verbose output'
    )

    parser.add_argument(
        '--no-png',
        action='store_true',
        help='Skip automatic PNG generation from Mermaid files'
    )

    parser.add_argument(
        '--strategy',
        choices=['quick', 'standard', 'deep'],
        default='standard',
        help='Analysis strategy: quick (fast overview), standard (balanced), deep (complete)'
    )

    parser.add_argument(
        '--streaming',
        action='store_true',
        help='Use streaming analysis with progress reporting'
    )

    parser.add_argument(
        '--incremental',
        action='store_true',
        help='Only analyze changed files (requires previous run)'
    )

    parser.add_argument(
        '--max-memory',
        type=int,
        default=1000,
        help='Max memory in MB (default: 1000)'
    )

    parser.add_argument(
        '--split-output',
        action='store_true',
        help='Split YAML output into multiple files (summary, functions, classes, modules, entry_points)'
    )

    parser.add_argument(
        '--separate-orphans',
        action='store_true',
        help='Separate consolidated project from orphaned/isolated functions into different folders'
    )

    parser.add_argument(
        '--data-flow',
        action='store_true',
        help='Export data flow analysis (pipelines, state patterns, dependencies, events)'
    )

    parser.add_argument(
        '--data-structures',
        action='store_true',
        help='Export data structure analysis (types, flows, optimization opportunities)'
    )

    parser.add_argument(
        '--refactor',
        action='store_true',
        help='Enable AI-driven refactoring analysis and prompt generation'
    )

    parser.add_argument(
        '--smell',
        help='Filter refactoring by specific code smell (e.g., god_function, feature_envy)'
    )

    parser.add_argument(
        '--llm-format',
        choices=['claude', 'gpt', 'markdown'],
        default='markdown',
        help='Format for refactoring prompts (default: markdown)'
    )

    return parser
176
+
177
+
178
def main():
    """Main CLI entry point.

    Dispatches the ``llm-flow`` / ``llm-context`` subcommands, otherwise
    analyzes ``args.source`` and exports the requested formats into the
    output directory. Exits with status 1 on analysis/export failure and
    2 on missing arguments; returns 0 on success.
    """
    # Handle special subcommands before argparse sees argv, since the
    # main parser treats the first token as a source path.
    if len(sys.argv) > 1 and sys.argv[1] == 'llm-flow':
        from .llm_flow_generator import main as llm_flow_main
        return llm_flow_main(sys.argv[2:])

    if len(sys.argv) > 1 and sys.argv[1] == 'llm-context':
        # Quick LLM context generation
        return generate_llm_context(sys.argv[2:])

    # For all other cases, use the regular parser
    parser = create_parser()
    args = parser.parse_args()

    # Handle analysis (default behavior)
    if not args.source:
        print("Error: missing required argument: source", file=sys.stderr)
        print("Usage: code2flow <source> [options]", file=sys.stderr)
        print(" or: code2flow llm-flow [options]", file=sys.stderr)
        sys.exit(2)

    # Validate source path
    source_path = Path(args.source)
    if not source_path.exists():
        print(f"Error: Source path not found: {source_path}", file=sys.stderr)
        sys.exit(1)

    # Create output directory
    output_dir = Path(args.output)
    output_dir.mkdir(parents=True, exist_ok=True)

    # Configure analysis; pattern detection toggles share one flag.
    config = Config(
        mode=args.mode,
        max_depth_enumeration=args.max_depth,
        detect_state_machines=not args.no_patterns,
        detect_recursion=not args.no_patterns,
        output_dir=str(output_dir)
    )

    if args.verbose:
        print(f"Analyzing: {source_path}")
        print(f"Mode: {args.mode}")
        print(f"Output: {output_dir}")

    # Run analysis
    try:
        if args.streaming or args.strategy in ['quick', 'deep']:
            # Use optimized streaming analyzer
            from .core.streaming_analyzer import (
                StreamingAnalyzer, STRATEGY_QUICK,
                STRATEGY_STANDARD, STRATEGY_DEEP
            )

            strategy_map = {
                'quick': STRATEGY_QUICK,
                'standard': STRATEGY_STANDARD,
                'deep': STRATEGY_DEEP
            }
            strategy = strategy_map.get(args.strategy, STRATEGY_STANDARD)

            # Adjust strategy for memory limit. Guard with max(1, ...) so a
            # --max-memory below 10 MB cannot zero out the file budget.
            strategy.max_files_in_memory = min(
                strategy.max_files_in_memory,
                max(1, args.max_memory // 10)  # Rough heuristic
            )

            analyzer = StreamingAnalyzer(config, strategy)

            if args.verbose:
                def on_progress(update):
                    pct = update.get('percentage', 0)
                    print(f"\r[{pct:.0f}%] {update.get('message', '')}", end='', flush=True)
                analyzer.set_progress_callback(on_progress)

            print(f"Analyzing with {args.strategy} strategy...")
            for update in analyzer.analyze_streaming(str(source_path)):
                # 'file_complete' updates are ignored: per-file results are
                # not accumulated here (see TODO below).
                if update['type'] == 'complete':
                    if args.verbose:
                        print()  # New line after progress
                    print(f"Completed in {update.get('elapsed_seconds', 0):.1f}s")

            # For streaming, we need to run again to get actual results
            # TODO: Modify streaming to accumulate results properly
            analyzer = ProjectAnalyzer(config)
            result = analyzer.analyze_project(str(source_path))

        else:
            # Use standard analyzer
            analyzer = ProjectAnalyzer(config)
            result = analyzer.analyze_project(str(source_path))

        if args.verbose:
            print("\nAnalysis complete:")
            print(f" - Functions: {len(result.functions)}")
            print(f" - Classes: {len(result.classes)}")
            print(f" - CFG nodes: {len(result.nodes)}")
            print(f" - CFG edges: {len(result.edges)}")

    except Exception as e:
        print(f"Error during analysis: {e}", file=sys.stderr)
        sys.exit(1)

    # Export results
    formats = [f.strip() for f in args.format.split(',')]

    # Handle 'all' format
    if 'all' in formats:
        formats = ['toon', 'map', 'flow', 'context', 'yaml', 'json', 'mermaid', 'png']

    try:
        if 'toon' in formats:
            exporter = ToonExporter()
            filepath = output_dir / 'analysis.toon'
            exporter.export(result, str(filepath))
            if args.verbose:
                print(f" - TOON (diagnostics): {filepath}")

        if 'map' in formats:
            exporter = MapExporter()
            filepath = output_dir / 'map.toon'
            exporter.export(result, str(filepath))
            if args.verbose:
                print(f" - MAP (structure): {filepath}")

        if 'flow' in formats:
            exporter = FlowExporter()
            filepath = output_dir / 'flow.toon'
            exporter.export(result, str(filepath))
            if args.verbose:
                print(f" - FLOW (data-flow): {filepath}")

        if 'context' in formats:
            exporter = ContextExporter()
            filepath = output_dir / 'context.md'
            exporter.export(result, str(filepath))
            if args.verbose:
                print(f" - CONTEXT (LLM narrative): {filepath}")

        if 'yaml' in formats:
            exporter = YAMLExporter()
            if args.separate_orphans:
                # Create separated output (consolidated vs orphans)
                sep_dir = output_dir / 'separated'
                exporter.export_separated(result, str(sep_dir), compact=True)
                if args.verbose:
                    print(f" - YAML (separated): {sep_dir}/")
            elif args.split_output:
                # Create split output for large projects
                split_dir = output_dir / 'split'
                exporter.export_split(result, str(split_dir), include_defaults=args.full)
                if args.verbose:
                    print(f" - YAML (split): {split_dir}/")
            else:
                filepath = output_dir / 'analysis.yaml'
                exporter.export(result, str(filepath), include_defaults=args.full)
                if args.verbose:
                    print(f" - YAML: {filepath}")

        if 'json' in formats:
            exporter = JSONExporter()
            filepath = output_dir / 'analysis.json'
            exporter.export(result, str(filepath), include_defaults=args.full)
            if args.verbose:
                print(f" - JSON: {filepath}")

        if 'mermaid' in formats:
            exporter = MermaidExporter()
            filepath = output_dir / 'flow.mmd'
            exporter.export(result, str(filepath))
            filepath = output_dir / 'calls.mmd'
            exporter.export_call_graph(result, str(filepath))
            filepath = output_dir / 'compact_flow.mmd'
            exporter.export_compact(result, str(filepath))
            if args.verbose:
                print(f" - Mermaid: {output_dir / '*.mmd'}")

            # Auto-generate PNG from Mermaid files (unless disabled)
            if not args.no_png:
                try:
                    from .mermaid_generator import generate_pngs
                    png_count = generate_pngs(output_dir, output_dir)
                    if args.verbose and png_count > 0:
                        print(f" - PNG: {png_count} files generated")
                except ImportError:
                    # Fallback to external script
                    try:
                        import subprocess
                        script_path = Path(__file__).parent.parent / 'mermaid_to_png.py'
                        if script_path.exists():
                            # BUGFIX: bind to 'proc', not 'result' — the old
                            # code clobbered the analysis result that the
                            # remaining export steps below still use.
                            # sys.executable runs the same interpreter rather
                            # than whatever 'python' is on PATH.
                            proc = subprocess.run([
                                sys.executable, str(script_path),
                                '--batch', str(output_dir), str(output_dir)
                            ], capture_output=True, text=True, timeout=60)
                            if proc.returncode == 0 and args.verbose:
                                print(f" - PNG: {output_dir / '*.png'}")
                    except Exception:
                        # Best-effort: PNG generation is optional tooling.
                        if args.verbose:
                            print(" - PNG: Skipped (install with: make install-mermaid)")
            elif args.verbose:
                print(" - PNG: Skipped (--no-png)")

        if 'png' in formats:
            visualizer = GraphVisualizer(result)
            filepath = output_dir / 'cfg.png'
            visualizer.visualize_cfg(str(filepath))
            filepath = output_dir / 'call_graph.png'
            visualizer.visualize_call_graph(str(filepath))
            if args.verbose:
                print(f" - PNG: {output_dir / '*.png'}")

        if args.data_structures:
            exporter = YAMLExporter()
            struct_path = output_dir / 'data_structures.yaml'
            exporter.export_data_structures(result, str(struct_path), compact=True)
            if args.verbose:
                print(f" - Data structures: {struct_path}")

        # Generate LLM context (backward compat: always generate context.md)
        if 'context' not in formats:
            exporter = ContextExporter()
            filepath = output_dir / 'context.md'
            exporter.export(result, str(filepath))
            if args.verbose:
                print(f" - CONTEXT (LLM narrative): {filepath}")

        # AI-driven refactoring prompts
        if args.refactor:
            from .refactor.prompt_engine import PromptEngine
            prompt_engine = PromptEngine(result)
            prompts = prompt_engine.generate_prompts()

            if prompts:
                prompts_dir = output_dir / 'prompts'
                prompts_dir.mkdir(parents=True, exist_ok=True)

                # Filter by smell if requested
                if args.smell:
                    prompts = {k: v for k, v in prompts.items() if args.smell in k.lower()}

                for filename, content in prompts.items():
                    prompt_path = prompts_dir / filename
                    prompt_path.write_text(content)

                if args.verbose:
                    print(f" - Refactoring prompts: {prompts_dir}/ ({len(prompts)} files)")
            else:
                if args.verbose:
                    print(" - Refactoring: No code smells detected.")

    except Exception as e:
        print(f"Error during export: {e}", file=sys.stderr)
        sys.exit(1)

    if args.verbose:
        print(f"\nAll outputs saved to: {output_dir}")

    return 0
446
+
447
+
448
def generate_llm_context(args_list):
    """Quick command to generate LLM context only.

    Args:
        args_list: Argument strings after the ``llm-context`` subcommand.

    Returns:
        int: 0 on success, 1 if the source path does not exist.
    """
    # argparse and Path are imported at module level; no local re-import needed.
    parser = argparse.ArgumentParser(
        prog='code2flow llm-context',
        description='Generate LLM-friendly context for a project'
    )
    parser.add_argument('source', help='Path to Python project')
    parser.add_argument('-o', '--output', default='./llm_context.md', help='Output file path')
    parser.add_argument('-v', '--verbose', action='store_true', help='Verbose output')

    args = parser.parse_args(args_list)

    # Imported lazily to avoid a circular import at module load time.
    from . import ProjectAnalyzer, FAST_CONFIG
    from .exporters import ContextExporter

    source_path = Path(args.source)
    if not source_path.exists():
        print(f"Error: Source path not found: {source_path}", file=sys.stderr)
        return 1

    if args.verbose:
        print(f"Generating LLM context for: {source_path}")

    # Use fast config with parallel disabled for stability.
    # NOTE(review): this mutates the shared module-level FAST_CONFIG object,
    # affecting any later user of it in this process — confirm intended.
    FAST_CONFIG.performance.parallel_enabled = False

    analyzer = ProjectAnalyzer(FAST_CONFIG)
    result = analyzer.analyze_project(str(source_path))

    exporter = ContextExporter()
    exporter.export(result, args.output)

    # Print summary
    print(f"\n✓ LLM context generated: {args.output}")
    print(f" Functions: {len(result.functions)}")
    print(f" Classes: {len(result.classes)}")
    print(f" Modules: {len(result.modules)}")

    return 0
490
+
491
+
492
# Script entry: propagate main()'s return code as the process exit status.
if __name__ == '__main__':
    sys.exit(main())
@@ -0,0 +1,36 @@
1
+ """Core analysis components for code2flow."""
2
+
3
+ from .analyzer import ProjectAnalyzer, FileCache, FastFileFilter
4
+ from .streaming_analyzer import (
5
+ StreamingAnalyzer,
6
+ IncrementalAnalyzer,
7
+ ScanStrategy,
8
+ SmartPrioritizer,
9
+ STRATEGY_QUICK,
10
+ STRATEGY_STANDARD,
11
+ STRATEGY_DEEP
12
+ )
13
+ from .config import Config, FAST_CONFIG, PerformanceConfig, FilterConfig
14
+ from .models import (
15
+ AnalysisResult, FlowNode, FlowEdge,
16
+ FunctionInfo, ClassInfo, ModuleInfo, Pattern
17
+ )
18
+
19
+ __all__ = [
20
+ 'ProjectAnalyzer',
21
+ 'StreamingAnalyzer',
22
+ 'IncrementalAnalyzer',
23
+ 'ScanStrategy',
24
+ 'SmartPrioritizer',
25
+ 'STRATEGY_QUICK',
26
+ 'STRATEGY_STANDARD',
27
+ 'STRATEGY_DEEP',
28
+ 'FileCache',
29
+ 'FastFileFilter',
30
+ 'Config',
31
+ 'FAST_CONFIG',
32
+ 'AnalysisResult',
33
+ 'FunctionInfo',
34
+ 'ClassInfo',
35
+ 'ModuleInfo',
36
+ ]