codeboarding 0.9.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (126)
  1. agents/__init__.py +0 -0
  2. agents/abstraction_agent.py +150 -0
  3. agents/agent.py +467 -0
  4. agents/agent_responses.py +363 -0
  5. agents/cluster_methods_mixin.py +281 -0
  6. agents/constants.py +13 -0
  7. agents/dependency_discovery.py +159 -0
  8. agents/details_agent.py +174 -0
  9. agents/llm_config.py +309 -0
  10. agents/meta_agent.py +105 -0
  11. agents/planner_agent.py +105 -0
  12. agents/prompts/__init__.py +85 -0
  13. agents/prompts/abstract_prompt_factory.py +63 -0
  14. agents/prompts/claude_prompts.py +381 -0
  15. agents/prompts/deepseek_prompts.py +389 -0
  16. agents/prompts/gemini_flash_prompts.py +362 -0
  17. agents/prompts/glm_prompts.py +407 -0
  18. agents/prompts/gpt_prompts.py +470 -0
  19. agents/prompts/kimi_prompts.py +400 -0
  20. agents/prompts/prompt_factory.py +179 -0
  21. agents/tools/__init__.py +8 -0
  22. agents/tools/base.py +96 -0
  23. agents/tools/get_external_deps.py +47 -0
  24. agents/tools/get_method_invocations.py +47 -0
  25. agents/tools/read_cfg.py +60 -0
  26. agents/tools/read_docs.py +132 -0
  27. agents/tools/read_file.py +90 -0
  28. agents/tools/read_file_structure.py +156 -0
  29. agents/tools/read_git_diff.py +131 -0
  30. agents/tools/read_packages.py +60 -0
  31. agents/tools/read_source.py +105 -0
  32. agents/tools/read_structure.py +49 -0
  33. agents/tools/toolkit.py +119 -0
  34. agents/validation.py +383 -0
  35. caching/__init__.py +4 -0
  36. caching/cache.py +29 -0
  37. caching/meta_cache.py +227 -0
  38. codeboarding-0.9.0.dist-info/METADATA +223 -0
  39. codeboarding-0.9.0.dist-info/RECORD +126 -0
  40. codeboarding-0.9.0.dist-info/WHEEL +5 -0
  41. codeboarding-0.9.0.dist-info/entry_points.txt +3 -0
  42. codeboarding-0.9.0.dist-info/licenses/LICENSE +21 -0
  43. codeboarding-0.9.0.dist-info/top_level.txt +18 -0
  44. core/__init__.py +101 -0
  45. core/plugin_loader.py +46 -0
  46. core/protocols.py +27 -0
  47. core/registry.py +46 -0
  48. diagram_analysis/__init__.py +4 -0
  49. diagram_analysis/analysis_json.py +346 -0
  50. diagram_analysis/diagram_generator.py +486 -0
  51. diagram_analysis/file_coverage.py +212 -0
  52. diagram_analysis/incremental/__init__.py +63 -0
  53. diagram_analysis/incremental/component_checker.py +236 -0
  54. diagram_analysis/incremental/file_manager.py +217 -0
  55. diagram_analysis/incremental/impact_analyzer.py +238 -0
  56. diagram_analysis/incremental/io_utils.py +281 -0
  57. diagram_analysis/incremental/models.py +72 -0
  58. diagram_analysis/incremental/path_patching.py +164 -0
  59. diagram_analysis/incremental/reexpansion.py +166 -0
  60. diagram_analysis/incremental/scoped_analysis.py +227 -0
  61. diagram_analysis/incremental/updater.py +464 -0
  62. diagram_analysis/incremental/validation.py +48 -0
  63. diagram_analysis/manifest.py +152 -0
  64. diagram_analysis/version.py +6 -0
  65. duckdb_crud.py +125 -0
  66. github_action.py +172 -0
  67. health/__init__.py +3 -0
  68. health/checks/__init__.py +11 -0
  69. health/checks/circular_deps.py +48 -0
  70. health/checks/cohesion.py +93 -0
  71. health/checks/coupling.py +140 -0
  72. health/checks/function_size.py +85 -0
  73. health/checks/god_class.py +167 -0
  74. health/checks/inheritance.py +104 -0
  75. health/checks/instability.py +77 -0
  76. health/checks/unused_code_diagnostics.py +338 -0
  77. health/config.py +172 -0
  78. health/constants.py +19 -0
  79. health/models.py +186 -0
  80. health/runner.py +236 -0
  81. install.py +518 -0
  82. logging_config.py +105 -0
  83. main.py +529 -0
  84. monitoring/__init__.py +12 -0
  85. monitoring/callbacks.py +163 -0
  86. monitoring/context.py +158 -0
  87. monitoring/mixin.py +16 -0
  88. monitoring/paths.py +47 -0
  89. monitoring/stats.py +50 -0
  90. monitoring/writers.py +172 -0
  91. output_generators/__init__.py +0 -0
  92. output_generators/html.py +163 -0
  93. output_generators/html_template.py +382 -0
  94. output_generators/markdown.py +140 -0
  95. output_generators/mdx.py +171 -0
  96. output_generators/sphinx.py +175 -0
  97. repo_utils/__init__.py +277 -0
  98. repo_utils/change_detector.py +289 -0
  99. repo_utils/errors.py +6 -0
  100. repo_utils/git_diff.py +74 -0
  101. repo_utils/ignore.py +341 -0
  102. static_analyzer/__init__.py +335 -0
  103. static_analyzer/analysis_cache.py +699 -0
  104. static_analyzer/analysis_result.py +269 -0
  105. static_analyzer/cluster_change_analyzer.py +391 -0
  106. static_analyzer/cluster_helpers.py +79 -0
  107. static_analyzer/constants.py +166 -0
  108. static_analyzer/git_diff_analyzer.py +224 -0
  109. static_analyzer/graph.py +746 -0
  110. static_analyzer/incremental_orchestrator.py +671 -0
  111. static_analyzer/java_config_scanner.py +232 -0
  112. static_analyzer/java_utils.py +227 -0
  113. static_analyzer/lsp_client/__init__.py +12 -0
  114. static_analyzer/lsp_client/client.py +1642 -0
  115. static_analyzer/lsp_client/diagnostics.py +62 -0
  116. static_analyzer/lsp_client/java_client.py +517 -0
  117. static_analyzer/lsp_client/language_settings.py +97 -0
  118. static_analyzer/lsp_client/typescript_client.py +235 -0
  119. static_analyzer/programming_language.py +152 -0
  120. static_analyzer/reference_resolve_mixin.py +166 -0
  121. static_analyzer/scanner.py +95 -0
  122. static_analyzer/typescript_config_scanner.py +54 -0
  123. tool_registry.py +433 -0
  124. user_config.py +134 -0
  125. utils.py +56 -0
  126. vscode_constants.py +124 -0
@@ -0,0 +1,346 @@
1
import json
import logging
from datetime import datetime, timezone

from pydantic import BaseModel, Field

from agents.agent_responses import Component, Relation, AnalysisInsights, assign_component_ids
7
+
8
+ logger = logging.getLogger(__name__)
9
+
10
+
11
class RelationJson(Relation):
    """Relation subclass that includes src_id/dst_id in JSON serialization."""

    # Serialized variants of the endpoint IDs; default to "" so relations loaded
    # from legacy JSON (without IDs) still validate.
    src_id: str = Field(default="", description="Component ID of the source.")
    dst_id: str = Field(default="", description="Component ID of the destination.")
16
+
17
+
18
class ComponentJson(Component):
    """Component subclass used for JSON output; adds nesting and serializable IDs."""

    # Override to include in JSON serialization (parent has exclude=True)
    component_id: str = Field(description="Deterministic unique identifier for this component.")
    can_expand: bool = Field(
        description="Whether the component can be expanded in detail or not.",
        default=False,
    )
    assigned_files: list[str] = Field(
        description="A list of source code names of files assigned to the component.",
        default_factory=list,
    )
    # Nested sub-analysis for expanded components
    components: list["ComponentJson"] | None = Field(
        description="Sub-components if expanded, None otherwise.", default=None
    )
    components_relations: list[RelationJson] | None = Field(
        description="Relations among sub-components if expanded, None otherwise.",
        default=None,
    )
37
+
38
+
39
class NotAnalyzedFile(BaseModel):
    """A single repository file excluded from analysis, with the reason why."""

    path: str = Field(description="Relative path of the file.")
    reason: str = Field(description="Exclusion reason for the file.")
42
+
43
+
44
class FileCoverageSummary(BaseModel):
    """Aggregate counts of analyzed vs. excluded files for one analysis run."""

    total_files: int = Field(description="Total number of text files in the repository.")
    analyzed: int = Field(description="Number of files included in the analysis.")
    not_analyzed: int = Field(description="Number of files excluded from the analysis.")
    not_analyzed_by_reason: dict[str, int] = Field(
        default_factory=dict, description="Count of excluded files grouped by reason."
    )
51
+
52
+
53
class FileCoverageReport(BaseModel):
    """Full file-coverage report: per-file lists plus the aggregated summary."""

    version: int = Field(default=1, description="Schema version of the file coverage report.")
    generated_at: str = Field(description="ISO timestamp of when the report was generated.")
    analyzed_files: list[str] = Field(description="List of analyzed file paths.")
    not_analyzed_files: list[NotAnalyzedFile] = Field(description="List of excluded files with optional reasons.")
    summary: FileCoverageSummary = Field(description="Aggregated coverage counts.")
59
+
60
+
61
class AnalysisMetadata(BaseModel):
    """Metadata header embedded in the unified analysis JSON document."""

    generated_at: str = Field(description="ISO timestamp of when the analysis was generated.")
    repo_name: str = Field(description="Name of the analyzed repository.")
    depth_level: int = Field(description="Maximum depth level of the analysis.")
    # Zeroed default keeps old call sites (that never pass coverage data) valid.
    file_coverage_summary: FileCoverageSummary = Field(
        default_factory=lambda: FileCoverageSummary(
            total_files=0, analyzed=0, not_analyzed=0, not_analyzed_by_reason={}
        ),
        description="Lightweight file coverage counts.",
    )
71
+
72
+
73
class UnifiedAnalysisJson(BaseModel):
    """Top-level schema of the unified analysis document (metadata + nested components)."""

    metadata: AnalysisMetadata = Field(description="Metadata about the analysis run.")
    description: str = Field(
        description="One paragraph explaining the functionality which is represented by this graph."
    )
    components: list[ComponentJson] = Field(description="List of the components identified in the project.")
    components_relations: list[RelationJson] = Field(description="List of relations among the components.")
80
+
81
+
82
def from_component_to_json_component(
    component: Component,
    expandable_components: list[Component],
    sub_analyses: dict[str, tuple[AnalysisInsights, list[Component]]] | None = None,
    processed_ids: set[str] | None = None,
) -> ComponentJson:
    """Convert a Component to a ComponentJson, optionally nesting sub-analysis data.

    ``processed_ids`` tracks component IDs already converted so that a component
    appearing twice (a cycle in the sub-analysis graph) is emitted without
    expansion instead of recursing forever.
    """
    processed_ids = set() if processed_ids is None else processed_ids

    cid: str = component.component_id
    if cid in processed_ids:
        # Duplicate/cycle guard: never expand the same component twice.
        logger.warning(f"Component {component.name} (ID: {cid}) already processed, skipping expansion")
        can_expand = False
    else:
        processed_ids.add(cid)
        can_expand = any(candidate.component_id == cid for candidate in expandable_components)

    children: list[ComponentJson] | None = None
    child_relations: list[RelationJson] | None = None

    if can_expand and sub_analyses and cid in sub_analyses:
        nested_analysis, nested_expandable = sub_analyses[cid]
        children = [
            from_component_to_json_component(sub, nested_expandable, sub_analyses, processed_ids)
            for sub in nested_analysis.components
        ]
        child_relations = [
            RelationJson(
                relation=rel.relation,
                src_name=rel.src_name,
                dst_name=rel.dst_name,
                src_id=rel.src_id,
                dst_id=rel.dst_id,
            )
            for rel in nested_analysis.components_relations
        ]

    return ComponentJson(
        name=component.name,
        component_id=cid,
        description=component.description,
        key_entities=component.key_entities,
        source_cluster_ids=component.source_cluster_ids,
        assigned_files=component.assigned_files,
        can_expand=can_expand,
        components=children,
        components_relations=child_relations,
    )
131
+
132
+
133
def from_analysis_to_json(
    analysis: AnalysisInsights,
    expandable_components: list[Component],
    sub_analyses: dict[str, tuple[AnalysisInsights, list[Component]]] | None = None,
) -> str:
    """Convert an AnalysisInsights to a flat JSON string (legacy-compatible, no metadata wrapper).

    Args:
        analysis: Root analysis to serialize.
        expandable_components: Components eligible for expansion (drives ``can_expand``).
        sub_analyses: Optional mapping of component_id -> (sub-analysis, expandable
            components) used to nest expanded components.

    Returns:
        A JSON string matching the old ``AnalysisInsightsJson`` shape, but with
        nested components where sub-analyses are available.
    """
    components_json = [
        from_component_to_json_component(c, expandable_components, sub_analyses, None)
        for c in analysis.components
    ]
    relations_json = [
        RelationJson(
            relation=r.relation,
            src_name=r.src_name,
            dst_name=r.dst_name,
            src_id=r.src_id,
            dst_id=r.dst_id,
        )
        for r in analysis.components_relations
    ]
    # Build a dict matching the old AnalysisInsightsJson shape but with nested components.
    data = {
        "description": analysis.description,
        "components": [c.model_dump(exclude_none=True) for c in components_json],
        "components_relations": [r.model_dump() for r in relations_json],
    }
    # `json` is imported at module level (previously a mid-function import).
    return json.dumps(data, indent=2)
161
+
162
+
163
def _compute_depth_level(
    sub_analyses: dict[str, tuple[AnalysisInsights, list[Component]]] | None,
) -> int:
    """Compute the maximum depth level from the sub_analyses structure.

    Returns 1 if there are no sub-analyses (root only), 2 for one level of
    sub-analyses, and so on; nested sub-analyses are traversed recursively
    (with cycle protection) to find the true maximum depth.
    """
    if not sub_analyses:
        return 1

    def _depth_below(analysis: AnalysisInsights, seen: set[str]) -> int:
        # Depth of this analysis: 1 plus the deepest expandable child, if any.
        deepest = 1
        for child in analysis.components:
            child_id = child.component_id
            if child_id not in sub_analyses or child_id in seen:
                continue
            seen.add(child_id)
            nested_analysis, _ = sub_analyses[child_id]
            deepest = max(deepest, 1 + _depth_below(nested_analysis, seen))
            seen.discard(child_id)
        return deepest

    # For each sub-analysis, the set of component IDs it directly contains.
    contained: dict[str, set[str]] = {
        cid: {comp.component_id for comp in entry[0].components}
        for cid, entry in sub_analyses.items()
    }

    overall = 1
    for cid, (analysis, _) in sub_analyses.items():
        # Only root-level entries count: skip any sub-analysis that some
        # *other* sub-analysis already nests as a component.
        if any(other != cid and cid in ids for other, ids in contained.items()):
            continue
        overall = max(overall, 1 + _depth_below(analysis, {cid}))
    return overall
205
+
206
+
207
def build_unified_analysis_json(
    analysis: AnalysisInsights,
    expandable_components: list[Component],
    repo_name: str,
    sub_analyses: dict[str, tuple[AnalysisInsights, list[Component]]] | None = None,
    file_coverage_summary: FileCoverageSummary | None = None,
) -> str:
    """Build the full unified analysis JSON with metadata and nested sub-analyses.

    The ``depth_level`` metadata is derived automatically from the sub_analyses
    structure; when no ``file_coverage_summary`` is supplied, a zeroed summary
    is used.
    """
    component_payload = [
        from_component_to_json_component(comp, expandable_components, sub_analyses, None)
        for comp in analysis.components
    ]

    # Substitute a zeroed coverage summary when none was provided.
    summary = (
        file_coverage_summary
        if file_coverage_summary is not None
        else FileCoverageSummary(total_files=0, analyzed=0, not_analyzed=0, not_analyzed_by_reason={})
    )

    relation_payload = [
        RelationJson(
            relation=rel.relation,
            src_name=rel.src_name,
            dst_name=rel.dst_name,
            src_id=rel.src_id,
            dst_id=rel.dst_id,
        )
        for rel in analysis.components_relations
    ]

    document = UnifiedAnalysisJson(
        metadata=AnalysisMetadata(
            generated_at=datetime.now(timezone.utc).isoformat(),
            repo_name=repo_name,
            depth_level=_compute_depth_level(sub_analyses),
            file_coverage_summary=summary,
        ),
        description=analysis.description,
        components=component_payload,
        components_relations=relation_payload,
    )
    return document.model_dump_json(indent=2, exclude_none=True)
251
+
252
+
253
def parse_unified_analysis(
    data: dict,
) -> tuple[AnalysisInsights, dict[str, AnalysisInsights]]:
    """Parse a unified analysis JSON dict into root AnalysisInsights and sub-analyses.

    Returns:
        (root_analysis, sub_analyses_dict) where sub_analyses_dict maps component_id
        to its nested AnalysisInsights.
    """
    collected: dict[str, AnalysisInsights] = {}
    root = _extract_analysis_recursive(data, collected)

    # Backward compatibility: old JSON carried no component IDs — if any root
    # component lacks one, retrofit IDs deterministically and re-key the dict.
    if any(comp.component_id == "" for comp in root.components):
        _assign_ids_and_rekey(root, collected)

    return root, collected
270
+
271
+
272
def _assign_ids_and_rekey(
    root_analysis: AnalysisInsights,
    sub_analyses: dict[str, AnalysisInsights],
) -> None:
    """Assign component IDs to an analysis loaded from old JSON (without IDs) and re-key sub_analyses.

    Mutates ``sub_analyses`` in place: entries keyed by component *name* are
    replaced with entries keyed by the newly assigned component IDs.
    """
    from agents.agent_responses import ROOT_PARENT_ID

    # Snapshot the name-keyed entries before rebuilding the dict id-keyed.
    name_keyed = dict(sub_analyses)
    sub_analyses.clear()

    _assign_ids_recursive(root_analysis, name_keyed, sub_analyses, ROOT_PARENT_ID)
285
+
286
+
287
def _assign_ids_recursive(
    analysis: AnalysisInsights,
    old_subs: dict[str, AnalysisInsights],
    new_subs: dict[str, AnalysisInsights],
    parent_id: str,
) -> None:
    """Recursively assign IDs and re-key sub_analyses from name-keyed to id-keyed."""
    assign_component_ids(analysis, parent_id=parent_id)
    for comp in analysis.components:
        # Components whose sub-analysis was keyed by name get re-keyed by ID.
        nested = old_subs.get(comp.name)
        if nested is None:
            continue
        new_subs[comp.component_id] = nested
        _assign_ids_recursive(nested, old_subs, new_subs, comp.component_id)
301
+
302
+
303
def build_id_to_name_map(root_analysis: AnalysisInsights, sub_analyses: dict[str, AnalysisInsights]) -> dict[str, str]:
    """Build a mapping from component_id to component name across all analysis levels."""
    mapping: dict[str, str] = {}
    for comp in root_analysis.components:
        mapping[comp.component_id] = comp.name
    # Later sub-analysis entries overwrite earlier ones on ID collision,
    # matching plain dict-assignment semantics.
    for analysis in sub_analyses.values():
        mapping.update({comp.component_id: comp.name for comp in analysis.components})
    return mapping
310
+
311
+
312
def _extract_analysis_recursive(data: dict, sub_analyses: dict[str, AnalysisInsights]) -> AnalysisInsights:
    """Recursively extract AnalysisInsights from a data dict, collecting all sub-analyses.

    Args:
        data: The analysis data dict containing components, description, etc.
        sub_analyses: Dict to populate with component_id -> AnalysisInsights mappings.

    Returns:
        AnalysisInsights for this level (components are non-nested at this level).
    """
    parsed: list[Component] = []

    for raw in data.get("components", []):
        # Flat component for this level; nesting is handled separately below.
        comp = Component(
            name=raw["name"],
            component_id=raw.get("component_id", ""),
            description=raw["description"],
            key_entities=raw.get("key_entities", []),
            assigned_files=raw.get("assigned_files", []),
            source_cluster_ids=raw.get("source_cluster_ids", []),
        )
        parsed.append(comp)

        # Descend into expanded components; legacy data without IDs is keyed by name.
        if raw.get("components") is not None:
            key = comp.component_id or raw["name"]
            sub_analyses[key] = _extract_analysis_recursive(raw, sub_analyses)

    return AnalysisInsights(
        description=data.get("description", ""),
        components=parsed,
        components_relations=[Relation(**rel) for rel in data.get("components_relations", [])],
    )