PyPI - bioguider - Versions diffs - 0.2.32__py3-none-any.whl → 0.2.34__py3-none-any.whl - Mend

bioguider-0.2.32-py3-none-any.whl → bioguider-0.2.34-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of bioguider might be problematic. Click here for more details.

Files changed (9)

bioguider/generation/llm_injector.py CHANGED

@@ -115,13 +115,9 @@ class LLMErrorInjector:
             max_words=max_words,
         )
         output, _ = conv.generate(system_prompt=system_prompt, instruction_prompt="Return the JSON now.")
-        try:
-            data = json.loads(output)
-        except Exception:
-            # try to locate JSON block
-            start = output.find("{")
-            end = output.rfind("}")
-            data = json.loads(output[start:end+1]) if start != -1 and end != -1 else {"corrupted_markdown": readme_text, "errors": []}
+        # Enhanced JSON parsing with better error handling
+        data = self._parse_json_output(output, readme_text)
         corrupted = data.get("corrupted_markdown", readme_text)
         # Validate output stays within original context; fallback to deterministic if invalid
         if not self._validate_corrupted(readme_text, corrupted, preserve_keywords):
@@ -133,6 +129,63 @@ class LLMErrorInjector:
         }
         return corrupted, manifest
+    def _parse_json_output(self, output: str, fallback_text: str) -> Dict[str, Any]:
+        """Enhanced JSON parsing with multiple fallback strategies."""
+        import re
+        # Strategy 1: Direct JSON parsing
+        try:
+            return json.loads(output)
+        except json.JSONDecodeError:
+            pass
+        # Strategy 2: Extract JSON block between ```json and ```
+        json_pattern = r'```(?:json)?\s*(\{.*?\})\s*```'
+        match = re.search(json_pattern, output, re.DOTALL)
+        if match:
+            try:
+                return json.loads(match.group(1))
+            except json.JSONDecodeError:
+                pass
+        # Strategy 3: Find first complete JSON object
+        start = output.find("{")
+        if start != -1:
+            # Find matching closing brace
+            brace_count = 0
+            end = start
+            for i, char in enumerate(output[start:], start):
+                if char == "{":
+                    brace_count += 1
+                elif char == "}":
+                    brace_count -= 1
+                    if brace_count == 0:
+                        end = i
+                        break
+            if brace_count == 0:  # Found complete JSON object
+                try:
+                    json_str = output[start:end+1]
+                    return json.loads(json_str)
+                except json.JSONDecodeError:
+                    pass
+        # Strategy 4: Try to fix common JSON issues
+        try:
+            # Remove markdown code fences
+            cleaned = re.sub(r'```(?:json)?\s*', '', output)
+            cleaned = re.sub(r'```\s*$', '', cleaned)
+            # Remove leading/trailing whitespace
+            cleaned = cleaned.strip()
+            # Try parsing again
+            return json.loads(cleaned)
+        except json.JSONDecodeError:
+            pass
+        # Strategy 5: Fallback to deterministic injection
+        print(f"Warning: Failed to parse LLM JSON output, using fallback. Output preview: {output[:200]}...")
+        return {"corrupted_markdown": fallback_text, "errors": []}
     def _extract_preserve_keywords(self, text: str) -> List[str]:
         # Extract capitalized terms, domain hyphenations, and hostnames in links
         kws: Set[str] = set()

bioguider/generation/suggestion_extractor.py CHANGED

@@ -21,7 +21,7 @@ class SuggestionExtractor:
                             id=f"readme-dependencies-{file_name}",
                             category="readme.dependencies",
                             severity="should_fix",
-                            source={"section": "readme", "field": "dependency_suggestions", "evidence": dep_suggestions, "score": dep_score},
+                            source={"section": "readme", "field": "dependency_suggestions", "score": dep_score},
                             target_files=[file_name],
                             action="add_dependencies_section",
                             anchor_hint="Dependencies",
@@ -36,7 +36,7 @@ class SuggestionExtractor:
                             id=f"readme-hardware-{file_name}",
                             category="readme.hardware",
                             severity="should_fix",
-                            source={"section": "readme", "field": "hardware_and_software_spec_suggestions", "evidence": hw_sw_suggestions, "score": hw_sw_score},
+                            source={"section": "readme", "field": "hardware_and_software_spec_suggestions", "score": hw_sw_score},
                             target_files=[file_name],
                             action="add_system_requirements_section",
                             anchor_hint="System Requirements",
@@ -51,7 +51,7 @@ class SuggestionExtractor:
                             id=f"readme-purpose-{file_name}",
                             category="readme.purpose",
                             severity="should_fix",
-                            source={"section": "readme", "field": "project_purpose_suggestions", "evidence": purpose_suggestions, "score": purpose_score},
+                            source={"section": "readme", "field": "project_purpose_suggestions", "score": purpose_score},
                             target_files=[file_name],
                             action="full_replace",
                             anchor_hint="Overview",
@@ -66,7 +66,7 @@ class SuggestionExtractor:
                             id=f"readme-readability-{file_name}",
                             category="readme.readability",
                             severity="should_fix",
-                            source={"section": "readme", "field": "readability_suggestions", "evidence": readability_suggestions, "score": readability_score},
+                            source={"section": "readme", "field": "readability_suggestions", "score": readability_score},
                             target_files=[file_name],
                             action="full_replace",
                             anchor_hint="Introduction",
@@ -78,7 +78,7 @@ class SuggestionExtractor:
                         id=f"readme-intro-cleanup-{file_name}",
                         category="readme.intro_cleanup",
                         severity="should_fix",
-                        source={"section": "readme", "field": "overview", "evidence": "Improve top-level overview for clarity and tone.", "score": "Fair"},
+                        source={"section": "readme", "field": "overview", "score": "Fair"},
                         target_files=[file_name],
                         action="replace_intro",
                         anchor_hint="Overview",
@@ -92,7 +92,7 @@ class SuggestionExtractor:
                             id=f"readme-dependencies-clarify-{file_name}",
                             category="readme.dependencies",
                             severity="should_fix",
-                            source={"section": "readme", "field": "dependencies", "evidence": str(dep_sugg), "score": dep_score},
+                            source={"section": "readme", "field": "dependencies", "score": dep_score},
                             target_files=[file_name],
                             action="add_dependencies_section",
                             anchor_hint="Dependencies",
@@ -103,7 +103,7 @@ class SuggestionExtractor:
                             id=f"readme-dependencies-fallback-{file_name}",
                             category="readme.dependencies",
                             severity="should_fix",
-                            source={"section": "readme", "field": "dependencies", "evidence": f"score={dep_score}", "score": dep_score},
+                            source={"section": "readme", "field": "dependencies", "score": dep_score},
                             target_files=[file_name],
                             action="add_dependencies_section",
                             anchor_hint="Dependencies",
@@ -118,7 +118,7 @@ class SuggestionExtractor:
                             id=f"readme-sysreq-clarify-{file_name}",
                             category="readme.system_requirements",
                             severity="should_fix",
-                            source={"section": "readme", "field": "hardware_and_software", "evidence": str(hw_sugg), "score": hw_score},
+                            source={"section": "readme", "field": "hardware_and_software", "score": hw_score},
                             target_files=[file_name],
                             action="add_system_requirements_section",
                             anchor_hint="System Requirements",
@@ -129,7 +129,7 @@ class SuggestionExtractor:
                             id=f"readme-sysreq-fallback-{file_name}",
                             category="readme.system_requirements",
                             severity="should_fix",
-                            source={"section": "readme", "field": "hardware_and_software", "evidence": f"score={hw_score}", "score": hw_score},
+                            source={"section": "readme", "field": "hardware_and_software", "score": hw_score},
                             target_files=[file_name],
                             action="add_system_requirements_section",
                             anchor_hint="System Requirements",
@@ -144,7 +144,7 @@ class SuggestionExtractor:
                             id=f"readme-license-{file_name}",
                             category="readme.license",
                             severity="nice_to_have",
-                            source={"section": "readme", "field": "license", "evidence": str(lic_sugg)},
+                            source={"section": "readme", "field": "license"},
                             target_files=[file_name],
                             action="mention_license_section",
                             anchor_hint="License",
@@ -159,7 +159,7 @@ class SuggestionExtractor:
                             id=f"readme-structure-clarify-{file_name}",
                             category="readme.readability",
                             severity="should_fix",
-                            source={"section": "readability", "field": "readability_suggestions", "evidence": str(read_sugg), "score": read_score},
+                            source={"section": "readability", "field": "readability_suggestions", "score": read_score},
                             target_files=[file_name],
                             action="normalize_headings_structure",
                             anchor_hint="Installation",
@@ -170,7 +170,7 @@ class SuggestionExtractor:
                             id=f"readme-structure-fallback-{file_name}",
                             category="readme.readability",
                             severity="should_fix",
-                            source={"section": "readability", "field": "readability_score", "evidence": f"score={read_score}", "score": read_score},
+                            source={"section": "readability", "field": "readability_score", "score": read_score},
                             target_files=[file_name],
                             action="normalize_headings_structure",
                             anchor_hint="Installation",
@@ -182,7 +182,7 @@ class SuggestionExtractor:
                                 id=f"readme-usage-{file_name}",
                                 category="readme.usage",
                                 severity="nice_to_have",
-                                source={"section": "readability", "field": "usage", "evidence": "Add Usage section as suggested."},
+                                source={"section": "readability", "field": "usage"},
                                 target_files=[file_name],
                                 action="add_usage_section",
                                 anchor_hint="Usage",
@@ -208,7 +208,7 @@ class SuggestionExtractor:
                             id=f"install-full-replace-{target}",
                             category="installation.full_replace",
                             severity="should_fix",
-                            source={"section": "installation", "field": "overall", "evidence": str(structured)},
+                            source={"section": "installation", "field": "overall"},
                             target_files=[target],
                             action="full_replace",
                             anchor_hint=None,
@@ -235,7 +235,7 @@ class SuggestionExtractor:
                                     id=f"userguide-readability-{file_name}-{i}",
                                     category="userguide.readability",
                                     severity="should_fix",
-                                    source={"section": "userguide", "field": "readability_suggestions", "evidence": suggestion, "score": readability_score},
+                                    source={"section": "userguide", "field": "readability_suggestions", "score": readability_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint=f"Readability-{i+1}",
@@ -252,7 +252,7 @@ class SuggestionExtractor:
                                     id=f"userguide-context-{file_name}-{i}",
                                     category="userguide.context",
                                     severity="should_fix",
-                                    source={"section": "userguide", "field": "context_and_purpose_suggestions", "evidence": suggestion, "score": context_score},
+                                    source={"section": "userguide", "field": "context_and_purpose_suggestions", "score": context_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint=f"Context-{i+1}",
@@ -269,7 +269,7 @@ class SuggestionExtractor:
                                     id=f"userguide-error-{file_name}-{i}",
                                     category="userguide.error_handling",
                                     severity="should_fix",
-                                    source={"section": "userguide", "field": "error_handling_suggestions", "evidence": suggestion, "score": error_score},
+                                    source={"section": "userguide", "field": "error_handling_suggestions", "score": error_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint=f"Error-Handling-{i+1}",
@@ -284,7 +284,7 @@ class SuggestionExtractor:
                             id=f"userguide-consistency-{file_name}",
                             category="userguide.consistency",
                             severity="should_fix",
-                            source={"section": "userguide", "field": "consistency", "evidence": f"score={score}"},
+                            source={"section": "userguide", "field": "consistency", "score": score},
                             target_files=[file_name],
                             action="full_replace",
                             anchor_hint="Examples",
@@ -309,7 +309,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-readability-{file_name}-{i}",
                                     category="tutorial.readability",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "readability_suggestions", "evidence": suggestion, "score": readability_score},
+                                    source={"section": "tutorial", "field": "readability_suggestions", "score": readability_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Introduction",
@@ -326,7 +326,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-setup-{file_name}-{i}",
                                     category="tutorial.setup",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "setup_and_dependencies_suggestions", "evidence": suggestion, "score": setup_score},
+                                    source={"section": "tutorial", "field": "setup_and_dependencies_suggestions", "score": setup_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Setup",
@@ -343,7 +343,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-reproducibility-{file_name}-{i}",
                                     category="tutorial.reproducibility",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "reproducibility_suggestions", "evidence": suggestion, "score": reproducibility_score},
+                                    source={"section": "tutorial", "field": "reproducibility_suggestions", "score": reproducibility_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Setup",
@@ -360,7 +360,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-structure-{file_name}-{i}",
                                     category="tutorial.structure",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "structure_and_navigation_suggestions", "evidence": suggestion, "score": structure_score},
+                                    source={"section": "tutorial", "field": "structure_and_navigation_suggestions", "score": structure_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Introduction",
@@ -377,7 +377,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-code-{file_name}-{i}",
                                     category="tutorial.code_quality",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "executable_code_quality_suggestions", "evidence": suggestion, "score": code_score},
+                                    source={"section": "tutorial", "field": "executable_code_quality_suggestions", "score": code_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Code Examples",
@@ -394,7 +394,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-verification-{file_name}-{i}",
                                     category="tutorial.verification",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "result_verification_suggestions", "evidence": suggestion, "score": verification_score},
+                                    source={"section": "tutorial", "field": "result_verification_suggestions", "score": verification_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Results",
@@ -411,7 +411,7 @@ class SuggestionExtractor:
                                     id=f"tutorial-performance-{file_name}-{i}",
                                     category="tutorial.performance",
                                     severity="should_fix",
-                                    source={"section": "tutorial", "field": "performance_and_resource_notes_suggestions", "evidence": suggestion, "score": performance_score},
+                                    source={"section": "tutorial", "field": "performance_and_resource_notes_suggestions", "score": performance_score},
                                     target_files=[file_name],
                                     action="full_replace",
                                     anchor_hint="Performance",
@@ -424,7 +424,7 @@ class SuggestionExtractor:
                             id=f"tutorial-consistency-{file_name}",
                             category="tutorial.consistency",
                             severity="should_fix",
-                            source={"section": "tutorial", "field": "consistency", "evidence": f"score={score}"},
+                            source={"section": "tutorial", "field": "consistency", "score": score},
                             target_files=[file_name],
                             action="full_replace",
                             anchor_hint=None,

bioguider/managers/generation_manager.py CHANGED

@@ -34,6 +34,7 @@ class DocumentationGenerationManager:
         self.output = OutputManager(base_outputs_dir=output_dir)
         self.llm_gen = LLMContentGenerator(llm)
         self.llm_cleaner = LLMCleaner(llm)
     def print_step(self, step_name: str | None = None, step_output: str | None = None):
         if self.step_callback is None:
@@ -143,54 +144,176 @@ class DocumentationGenerationManager:
             self.print_step(step_name="ProcessingFile", step_output=f"Processing {fpath} ({processed_files}/{total_files}) - {len(edits)} edits")
             original_content = files.get(fpath, "")
+            # Group suggestions by file to avoid duplicate generation
+            file_suggestions = []
+            full_replace_edits = []
+            section_edits = []
+            for e in edits:
+                suggestion = next((s for s in suggestions if s.id == e.suggestion_id), None) if e.suggestion_id else None
+                if suggestion:
+                    file_suggestions.append(suggestion)
+                    if e.edit_type == "full_replace":
+                        full_replace_edits.append(e)
+                    else:
+                        section_edits.append(e)
+            # Debug: Save suggestion grouping info
+            import json
+            import os
+            from datetime import datetime
+            debug_dir = "outputs/debug_generation"
+            os.makedirs(debug_dir, exist_ok=True)
+            safe_filename = fpath.replace("/", "_").replace(".", "_")
+            grouping_info = {
+                "file_path": fpath,
+                "total_edits": len(edits),
+                "file_suggestions_count": len(file_suggestions),
+                "full_replace_edits_count": len(full_replace_edits),
+                "section_edits_count": len(section_edits),
+                "suggestions": [
+                    {
+                        "id": s.id,
+                        "category": s.category,
+                        "content_guidance": s.content_guidance[:200] + "..." if len(s.content_guidance or "") > 200 else s.content_guidance,
+                        "target_files": s.target_files
+                    } for s in file_suggestions
+                ],
+                "timestamp": datetime.now().isoformat()
+            }
+            grouping_file = os.path.join(debug_dir, f"{safe_filename}_grouping.json")
+            with open(grouping_file, 'w', encoding='utf-8') as f:
+                json.dump(grouping_info, f, indent=2, ensure_ascii=False)
             content = original_content
             total_stats = {"added_lines": 0}
-            for e in edits:
-                context = original_content
-                if not e.content_template or e.content_template.strip() == "":
-                    # Generate LLM content - use full document generation for full_replace, section generation for others
-                    suggestion = next((s for s in suggestions if s.id == e.suggestion_id), None) if e.suggestion_id else None
-                    if suggestion:
-                        if e.edit_type == "full_replace":
-                            self.print_step(step_name="GeneratingContent", step_output=f"Generating full document for {e.suggestion_id} using LLM...")
+            # CRITICAL: Generate content ONCE per file if there are full_replace edits
+            # All suggestions for this file are merged into a single evaluation report
+            # This prevents duplicate content generation
+            if full_replace_edits:
+                self.print_step(
+                    step_name="GeneratingContent",
+                    step_output=f"🔄 Generating full document for {fpath} with {len(file_suggestions)} suggestions using LLM (SINGLE CALL)..."
+                )
+                # Merge all suggestions for this file into a single evaluation report
+                # Format suggestions with clear numbering to help LLM understand they're separate improvements
+                suggestions_list = []
+                for idx, s in enumerate(file_suggestions, 1):
+                    suggestions_list.append({
+                        "suggestion_number": idx,
+                        "category": s.category if hasattr(s, 'category') else "general",
+                        "content_guidance": s.content_guidance
+                    })
+                merged_evaluation_report = {
+                    "total_suggestions": len(file_suggestions),
+                    "integration_instruction": f"Integrate ALL {len(file_suggestions)} suggestions below into ONE cohesive document. Do NOT create {len(file_suggestions)} separate versions.",
+                    "suggestions": suggestions_list
+                }
+                # Debug: Save merged evaluation report
+                merged_report_file = os.path.join(debug_dir, f"{safe_filename}_merged_report.json")
+                with open(merged_report_file, 'w', encoding='utf-8') as f:
+                    json.dump(merged_evaluation_report, f, indent=2, ensure_ascii=False)
+                # Debug: Log that we're about to make a single generation call
+                debug_log_file = os.path.join(debug_dir, f"{safe_filename}_generation_log.txt")
+                with open(debug_log_file, 'a', encoding='utf-8') as f:
+                    f.write(f"\n=== GENERATION CALL at {datetime.now().isoformat()} ===\n")
+                    f.write(f"File: {fpath}\n")
+                    f.write(f"Full replace edits: {len(full_replace_edits)}\n")
+                    f.write(f"Total suggestions: {len(file_suggestions)}\n")
+                    f.write(f"Merged into single call: YES\n")
+                    f.write(f"Suggestion IDs: {[s.id for s in file_suggestions]}\n\n")
+                    gen_content, gen_usage = self.llm_gen.generate_full_document(
+                        target_file=fpath,
+                        evaluation_report=merged_evaluation_report,
+                        context=original_content,
+                        original_content=original_content,
+                    )
+                # Debug: Log completion
+                with open(debug_log_file, 'a', encoding='utf-8') as f:
+                    f.write(f"Generation completed at {datetime.now().isoformat()}\n")
+                    f.write(f"Content length: {len(gen_content) if isinstance(gen_content, str) else 0} characters\n")
+                    f.write(f"Tokens used: {gen_usage.get('total_tokens', 0)}\n")
+                    f.write(f"SUCCESS: {isinstance(gen_content, str) and gen_content}\n\n")
+                if isinstance(gen_content, str) and gen_content:
+                    self.print_step(step_name="LLMFullDoc", step_output=f"✓ Generated full document for {fpath} ({gen_usage.get('total_tokens', 0)} tokens)")
+                    # Apply the generated content to all full_replace edits
+                    for e in full_replace_edits:
+                        e.content_template = gen_content
+                    content = gen_content
+                else:
+                    # Fallback: try individual generation but only for the first edit to avoid duplicates
+                    if full_replace_edits:
+                        e = full_replace_edits[0]  # Only process the first edit
+                        suggestion = next((s for s in suggestions if s.id == e.suggestion_id), None) if e.suggestion_id else None
+                        if suggestion and (not e.content_template or e.content_template.strip() == ""):
+                            self.print_step(step_name="GeneratingContent", step_output=f"Fallback: Generating full document for {e.suggestion_id} using LLM...")
                             gen_content, gen_usage = self.llm_gen.generate_full_document(
                                 target_file=e.file_path,
-                                evaluation_report={"suggestion": suggestion.content_guidance, "evidence": suggestion.source.get("evidence", "") if suggestion.source else ""},
-                                context=context,
+                                evaluation_report={"suggestion": suggestion.content_guidance},
+                                context=original_content,
+                                original_content=original_content,
                             )
                             if isinstance(gen_content, str) and gen_content:
                                 self.print_step(step_name="LLMFullDoc", step_output=f"✓ Generated full document for {e.suggestion_id} ({gen_usage.get('total_tokens', 0)} tokens)")
-                                e.content_template = gen_content
-                        else:
-                            self.print_step(step_name="GeneratingContent", step_output=f"Generating section for {e.suggestion_id} using LLM...")
-                            gen_section, gen_usage = self.llm_gen.generate_section(
-                                suggestion=suggestion,
-                                style=plan.style_profile,
-                                context=context,
-                            )
-                            if isinstance(gen_section, str) and gen_section:
-                                self.print_step(step_name="LLMSection", step_output=f"✓ Generated section for {e.suggestion_id} ({gen_usage.get('total_tokens', 0)} tokens)")
-                                # Ensure header present
-                                if gen_section.lstrip().startswith("#"):
-                                    e.content_template = gen_section
-                                else:
-                                    title = e.anchor.get('value', '').strip() or ''
-                                    e.content_template = f"## {title}\n\n{gen_section}" if title else gen_section
-                content, stats = self.renderer.apply_edit(content, e)
-                # After applying full document or section changes, run a general cleaner pass for all text files
-                # to fix markdown/formatting issues without changing meaning.
-                try:
-                    if fpath.endswith((".md", ".rst", ".Rmd", ".Rd")) and content:
-                        self.print_step(step_name="CleaningContent", step_output=f"Cleaning formatting for {fpath}...")
-                        cleaned, _usage = self.llm_cleaner.clean_readme(content)
-                        if isinstance(cleaned, str) and cleaned.strip():
-                            content = cleaned
+                                # Apply the same content to all full_replace edits
+                                for edit in full_replace_edits:
+                                    edit.content_template = gen_content
+                                content = gen_content
+            else:
+                # Handle section edits individually
+                for e in section_edits:
+                    suggestion = next((s for s in suggestions if s.id == e.suggestion_id), None) if e.suggestion_id else None
+                    if suggestion and (not e.content_template or e.content_template.strip() == ""):
+                        self.print_step(step_name="GeneratingContent", step_output=f"Generating section for {e.suggestion_id} using LLM...")
+                        gen_section, gen_usage = self.llm_gen.generate_section(
+                            suggestion=suggestion,
+                            style=plan.style_profile,
+                            context=original_content,
+                        )
+                        if isinstance(gen_section, str) and gen_section:
+                            self.print_step(step_name="LLMSection", step_output=f"✓ Generated section for {e.suggestion_id} ({gen_usage.get('total_tokens', 0)} tokens)")
+                            # Ensure header present
+                            if gen_section.lstrip().startswith("#"):
+                                e.content_template = gen_section
+                            else:
+                                title = e.anchor.get('value', '').strip() or ''
+                                e.content_template = f"## {title}\n\n{gen_section}" if title else gen_section
+                    content, stats = self.renderer.apply_edit(content, e)
+                    total_stats["added_lines"] = total_stats.get("added_lines", 0) + stats.get("added_lines", 0)
+            # Apply remaining edits that weren't full_replace
+            for e in edits:
+                if e.edit_type != "full_replace":
+                    content, stats = self.renderer.apply_edit(content, e)
+                    total_stats["added_lines"] = total_stats.get("added_lines", 0) + stats.get("added_lines", 0)
+            # After applying full document or section changes, run a general cleaner pass for all text files
+            # to fix markdown/formatting issues without changing meaning.
+            try:
+                if fpath.endswith((".md", ".rst", ".Rmd", ".Rd")) and content:
+                    self.print_step(step_name="CleaningContent", step_output=f"Cleaning formatting for {fpath}...")
+                    cleaned, _usage = self.llm_cleaner.clean_readme(content)
+                    if isinstance(cleaned, str) and cleaned.strip():
+                        content = cleaned
+                    # LLM cleaner now handles markdown fences and unwanted summaries
-                        # LLM cleaner now handles markdown fences and unwanted summaries
-                except Exception:
-                    pass
-                total_stats["added_lines"] = total_stats.get("added_lines", 0) + stats.get("added_lines", 0)
+            except Exception:
+                pass
             revised[fpath] = content
             diff_stats[fpath] = total_stats
             self.print_step(step_name="RenderedFile", step_output=f"✓ Completed {fpath} - added {total_stats['added_lines']} lines")
@@ -373,7 +496,6 @@ class DocumentationGenerationManager:
             for e in edits:
                 sug = next((s for s in suggestions if s.id == e.suggestion_id), None)
                 guidance = sug.content_guidance if sug else ""
-                evidence = sug.source.get("evidence", "") if sug and sug.source else ""
                 section = e.anchor.get('value', 'General improvements')
                 # Convert technical action names to user-friendly descriptions
@@ -445,61 +567,18 @@ class DocumentationGenerationManager:
                 # Show evaluation reasoning that triggered this improvement
                 if sug and sug.source:
-                    evidence = sug.source.get("evidence", "")
                     score = sug.source.get("score", "")
                     category = sug.category or ""
                     # Format category for display (e.g., "readme.dependencies" -> "Dependencies")
                     category_display = category.split('.')[-1].replace('_', ' ').title() if category else ""
-                    if evidence:
-                        # Handle different evidence types
-                        if isinstance(evidence, dict):
-                            # Extract key information from dict evidence
-                            evidence_text = evidence.get("dependency_suggestions", "") or evidence.get("evidence", "")
-                            if not evidence_text:
-                                evidence_text = f"Installation evaluation: {evidence.get('overall_score', 'Unknown')} score"
-                        else:
-                            evidence_text = str(evidence)
-                            # Handle Python dict string evidence (from full_replace actions)
-                            if evidence_text.startswith("{") and evidence_text.endswith("}"):
-                                try:
-                                    import ast
-                                    evidence_dict = ast.literal_eval(evidence_text)
-                                    # Extract specific suggestions from the evaluation report
-                                    dep_sugg = evidence_dict.get("dependency_suggestions", "")
-                                    hw_req = evidence_dict.get("hardware_requirements", False)
-                                    compat_os = evidence_dict.get("compatible_os", True)
-                                    overall_score = evidence_dict.get("overall_score", "")
-                                    # Build specific reason based on evaluation findings
-                                    reasons = []
-                                    if dep_sugg:
-                                        reasons.append(f"Dependencies: {dep_sugg}")
-                                    if hw_req is False:
-                                        reasons.append("Hardware requirements not specified")
-                                    if compat_os is False:
-                                        reasons.append("Operating system compatibility unclear")
-                                    if overall_score and overall_score not in ("Excellent", "Good"):
-                                        reasons.append(f"Overall score: {overall_score}")
-                                    if reasons:
-                                        evidence_text = "; ".join(reasons)
-                                    else:
-                                        evidence_text = f"Installation evaluation score: {overall_score}"
-                                except:
-                                    evidence_text = "Installation documentation needs improvement"
-                        if score and category_display:
-                            lines.append(f"  - *Reason:* [{category_display} - {score}] {evidence_text}")
-                        elif score:
-                            lines.append(f"  - *Reason:* [{score}] {evidence_text}")
-                        elif category_display:
-                            lines.append(f"  - *Reason:* [{category_display}] {evidence_text}")
-                        else:
-                            lines.append(f"  - *Reason:* {evidence_text}")
+                    if score and category_display:
+                        lines.append(f"  - *Reason:* [{category_display} - {score}]")
                     elif score:
-                        lines.append(f"  - *Reason:* Evaluation score was '{score}' - needs improvement")
+                        lines.append(f"  - *Reason:* [{score}]")
+                    elif category_display:
+                        lines.append(f"  - *Reason:* [{category_display}]")
                 # Show what was actually implemented (different from reason)
                 if guidance:

{bioguider-0.2.32.dist-info → bioguider-0.2.34.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: bioguider
-Version: 0.2.32
+Version: 0.2.34
 Summary: An AI-Powered package to help biomedical developers to generate clear documentation
 License: MIT
 Author: Cankun Wang

bioguider 0.2.32__py3-none-any.whl → 0.2.34__py3-none-any.whl

Potentially problematic release.

bioguider 0.2.32-py3-none-any.whl → 0.2.34-py3-none-any.whl