pdd-cli 0.0.23-py3-none-any.whl → 0.0.25-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of pdd-cli has been flagged as potentially problematic.
Files changed (49)
  1. pdd/__init__.py +7 -1
  2. pdd/bug_main.py +21 -3
  3. pdd/bug_to_unit_test.py +16 -5
  4. pdd/change.py +2 -1
  5. pdd/change_main.py +407 -189
  6. pdd/cli.py +853 -301
  7. pdd/code_generator.py +2 -1
  8. pdd/conflicts_in_prompts.py +2 -1
  9. pdd/construct_paths.py +377 -222
  10. pdd/context_generator.py +2 -1
  11. pdd/continue_generation.py +3 -2
  12. pdd/crash_main.py +55 -20
  13. pdd/data/llm_model.csv +8 -8
  14. pdd/detect_change.py +2 -1
  15. pdd/fix_code_loop.py +465 -160
  16. pdd/fix_code_module_errors.py +7 -4
  17. pdd/fix_error_loop.py +9 -9
  18. pdd/fix_errors_from_unit_tests.py +207 -365
  19. pdd/fix_main.py +31 -4
  20. pdd/fix_verification_errors.py +285 -0
  21. pdd/fix_verification_errors_loop.py +975 -0
  22. pdd/fix_verification_main.py +412 -0
  23. pdd/generate_output_paths.py +427 -183
  24. pdd/generate_test.py +3 -2
  25. pdd/increase_tests.py +2 -2
  26. pdd/llm_invoke.py +18 -8
  27. pdd/pdd_completion.zsh +38 -1
  28. pdd/preprocess.py +3 -3
  29. pdd/process_csv_change.py +466 -154
  30. pdd/prompts/extract_prompt_split_LLM.prompt +7 -4
  31. pdd/prompts/extract_prompt_update_LLM.prompt +11 -5
  32. pdd/prompts/extract_unit_code_fix_LLM.prompt +2 -2
  33. pdd/prompts/find_verification_errors_LLM.prompt +25 -0
  34. pdd/prompts/fix_code_module_errors_LLM.prompt +29 -0
  35. pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +5 -5
  36. pdd/prompts/fix_verification_errors_LLM.prompt +20 -0
  37. pdd/prompts/generate_test_LLM.prompt +9 -3
  38. pdd/prompts/split_LLM.prompt +3 -3
  39. pdd/prompts/update_prompt_LLM.prompt +3 -3
  40. pdd/split.py +13 -12
  41. pdd/split_main.py +22 -13
  42. pdd/trace_main.py +7 -0
  43. pdd/xml_tagger.py +2 -1
  44. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/METADATA +4 -4
  45. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/RECORD +49 -44
  46. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/WHEEL +1 -1
  47. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/entry_points.txt +0 -0
  48. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/licenses/LICENSE +0 -0
  49. {pdd_cli-0.0.23.dist-info → pdd_cli-0.0.25.dist-info}/top_level.txt +0 -0
pdd/fix_main.py CHANGED
@@ -2,10 +2,12 @@ import sys
 from typing import Tuple, Optional
 import click
 from rich import print as rprint
+from rich.markup import MarkupError, escape
 
 import requests
 import asyncio
 import os
+from pathlib import Path
 
 from .preprocess import preprocess
 
@@ -15,6 +17,9 @@ from .fix_error_loop import fix_error_loop
 from .get_jwt_token import get_jwt_token
 from .get_language import get_language
 
+# Import DEFAULT_STRENGTH from the package
+from . import DEFAULT_STRENGTH
+
 def fix_main(
     ctx: click.Context,
     prompt_file: str,
@@ -65,6 +70,12 @@ def fix_main(
     analysis_results = None
 
     try:
+        # Verify error file exists if not in loop mode
+        if not loop:
+            error_path = Path(error_file)
+            if not error_path.exists():
+                raise FileNotFoundError(f"Error file '{error_file}' does not exist.")
+
         # Construct file paths
         input_file_paths = {
             "prompt_file": prompt_file,
@@ -85,11 +96,12 @@ def fix_main(
             force=ctx.obj.get('force', False),
             quiet=ctx.obj.get('quiet', False),
             command="fix",
-            command_options=command_options
+            command_options=command_options,
+            create_error_file=loop  # Only create error file if in loop mode
         )
 
         # Get parameters from context
-        strength = ctx.obj.get('strength', 0.9)
+        strength = ctx.obj.get('strength', DEFAULT_STRENGTH)
         temperature = ctx.obj.get('temperature', 0)
         verbose = ctx.obj.get('verbose', False)
         if loop:
@@ -139,7 +151,16 @@ def fix_main(
         if verbose and analysis_results:
             # Log the first 200 characters of analysis if in verbose mode
             analysis_preview = analysis_results[:200] + "..." if len(analysis_results) > 200 else analysis_results
-            rprint(f"[bold]Analysis preview:[/bold] {analysis_preview}")
+            try:
+                # Attempt to print the preview using rich markup parsing
+                rprint(f"[bold]Analysis preview:[/bold] {analysis_preview}")
+            except MarkupError as me:
+                # If markup fails, print a warning and the escaped preview
+                rprint(f"[bold yellow]Warning:[/bold yellow] Analysis preview contained invalid markup: {me}")
+                rprint(f"[bold]Raw Analysis preview (escaped):[/bold] {escape(analysis_preview)}")
+            except Exception as e:
+                # Handle other potential errors during preview printing
+                rprint(f"[bold red]Error printing analysis preview: {e}[/bold red]")
         if success:
             rprint("[bold green]Fixed files saved:[/bold green]")
             rprint(f" Test file: {output_file_paths['output_test']}")
@@ -263,5 +284,11 @@ def fix_main(
 
     except Exception as e:
         if not ctx.obj.get('quiet', False):
-            rprint(f"[bold red]Error:[/bold red] {str(e)}")
+            # Safely handle and print MarkupError
+            if isinstance(e, MarkupError):
+                rprint(f"[bold red]Markup Error in fix_main:[/bold red]")
+                rprint(escape(str(e)))
+            else:
+                # Print other errors normally (might still fail if they contain markup)
+                rprint(f"[bold red]Error:[/bold red] {str(e)}")
         sys.exit(1)
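
Why the MarkupError guards above matter: rich interprets square-bracket sequences in printed strings as style markup, and LLM-generated analysis text often contains brackets, so printing an unescaped preview can raise at runtime. A minimal standalone sketch of the same pattern (the analysis_preview value is a hypothetical stand-in, not from the package):

from rich import print as rprint
from rich.markup import MarkupError, escape

# Hypothetical LLM output: "[/note]" looks like a closing rich tag with no opener.
analysis_preview = "Removed stray tag [/note] from the test output"

try:
    # rich raises MarkupError when it encounters markup it cannot parse.
    rprint(f"[bold]Analysis preview:[/bold] {analysis_preview}")
except MarkupError:
    # escape() neutralizes the brackets so the raw text prints safely.
    rprint(f"[bold]Analysis preview (escaped):[/bold] {escape(analysis_preview)}")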
pdd/fix_verification_errors.py ADDED
@@ -0,0 +1,285 @@
+import re
+from typing import Dict, Any
+from rich import print as rprint
+from rich.markdown import Markdown
+from .load_prompt_template import load_prompt_template
+from .llm_invoke import llm_invoke
+
+def fix_verification_errors(
+    program: str,
+    prompt: str,
+    code: str,
+    output: str,
+    strength: float,
+    temperature: float = 0.0,
+    verbose: bool = False,
+) -> Dict[str, Any]:
+    """
+    Identifies and fixes issues in a code module based on verification output.
+
+    Args:
+        program: The program code that ran the code module.
+        prompt: The prompt used to generate the code module.
+        code: The code module to be fixed.
+        output: The output logs from the program run during verification.
+        strength: The strength (0-1) for the LLM model selection.
+        temperature: The temperature for the LLM model. Defaults to 0.
+        verbose: If True, prints detailed execution information. Defaults to False.
+
+    Returns:
+        A dictionary containing:
+        - 'explanation': A string with verification details and fix explanation
+          in XML format, or None if no issues were found.
+        - 'fixed_program': The potentially fixed program code string.
+        - 'fixed_code': The potentially fixed code module string.
+        - 'total_cost': The total cost incurred from LLM calls.
+        - 'model_name': The name of the LLM model used.
+        - 'verification_issues_count': The number of issues found during verification.
+    """
+    total_cost = 0.0
+    model_name = None
+    verification_issues_count = 0
+    verification_details = None
+    fix_explanation = None
+    fixed_program = program
+    fixed_code = code
+    final_explanation = None
+
+    # Check only essential inputs, allow empty output
+    if not all([program, prompt, code]):
+        # Keep the error print for program, prompt, code missing
+        rprint("[bold red]Error:[/bold red] Missing one or more required inputs (program, prompt, code).")
+        return {
+            "explanation": None,
+            "fixed_program": program,  # Return original if possible
+            "fixed_code": code,  # Return original if possible
+            "total_cost": 0.0,
+            "model_name": None,
+            "verification_issues_count": 0,
+        }
+    if not (0.0 <= strength <= 1.0):
+        rprint(f"[bold red]Error:[/bold red] Strength must be between 0.0 and 1.0, got {strength}.")
+        return {
+            "explanation": None,
+            "fixed_program": program,
+            "fixed_code": code,
+            "total_cost": 0.0,
+            "model_name": None,
+            "verification_issues_count": 0,
+        }
+
+    if verbose:
+        rprint("[blue]Loading prompt templates...[/blue]")
+    try:
+        find_errors_prompt_template = load_prompt_template("find_verification_errors_LLM")
+        fix_errors_prompt_template = load_prompt_template("fix_verification_errors_LLM")
+        if not find_errors_prompt_template or not fix_errors_prompt_template:
+            raise ValueError("One or both prompt templates could not be loaded.")
+    except Exception as e:
+        rprint(f"[bold red]Error loading prompt templates:[/bold red] {e}")
+        return {
+            "explanation": None,
+            "fixed_program": program,
+            "fixed_code": code,
+            "total_cost": total_cost,
+            "model_name": model_name,
+            "verification_issues_count": verification_issues_count,
+        }
+    if verbose:
+        rprint("[green]Prompt templates loaded successfully.[/green]")
+
+    if verbose:
+        rprint(f"\n[blue]Step 2: Running verification check (Strength: {strength}, Temp: {temperature})...[/blue]")
+
+    verification_input_json = {
+        "program": program,
+        "prompt": prompt,
+        "code": code,
+        "output": output,
+    }
+
+    try:
+        verification_response = llm_invoke(
+            prompt=find_errors_prompt_template,
+            input_json=verification_input_json,
+            strength=strength,
+            temperature=temperature,
+            verbose=False,  # Keep internal llm_invoke verbose off unless needed
+        )
+        total_cost += verification_response.get('cost', 0.0)
+        model_name = verification_response.get('model_name', model_name)
+        verification_result = verification_response.get('result', '')
+
+        if verbose:
+            rprint(f"[cyan]Verification LLM call complete.[/cyan]")
+            rprint(f" [dim]Model Used:[/dim] {verification_response.get('model_name', 'N/A')}")
+            rprint(f" [dim]Cost:[/dim] ${verification_response.get('cost', 0.0):.6f}")
+
+    except Exception as e:
+        rprint(f"[bold red]Error during verification LLM call:[/bold red] {e}")
+        return {
+            "explanation": None,
+            "fixed_program": program,
+            "fixed_code": code,
+            "total_cost": total_cost,
+            "model_name": model_name,
+            "verification_issues_count": verification_issues_count,
+        }
+
+    if verbose:
+        rprint("\n[blue]Verification Result:[/blue]")
+        # Markdown object handles its own rendering, no extra needed here
+        rprint(Markdown(verification_result))
+
+    issues_found = False
+    try:
+        # Attempt to match and extract digits directly
+        count_match = re.search(r"<issues_count>(\d+)</issues_count>", verification_result)
+        if count_match:
+            verification_issues_count = int(count_match.group(1))  # Safe due to \d+
+        else:
+            # Specific match failed, check if tag exists with invalid content or is missing
+            generic_count_match = re.search(r"<issues_count>(.*?)</issues_count>", verification_result, re.DOTALL)
+            if generic_count_match:
+                # Tag found, but content is not \d+ -> Parsing Error
+                rprint("[bold red]Error:[/bold red] Could not parse integer value from <issues_count> tag.")
+                # Return the specific error structure for parsing errors after verification call
+                return {
+                    "explanation": None,
+                    "fixed_program": program,
+                    "fixed_code": code,
+                    "total_cost": total_cost,  # Cost incurred so far
+                    "model_name": model_name,  # Model used so far
+                    "verification_issues_count": 0,  # Reset count on parsing error
+                }
+            else:
+                # Tag truly not found -> Warning
+                rprint("[yellow]Warning:[/yellow] Could not find <issues_count> tag in verification result. Assuming 0 issues.")
+                verification_issues_count = 0
+
+        # Proceed to check for details tag if count > 0
+        if verification_issues_count > 0:
+            details_match = re.search(r"<details>(.*?)</details>", verification_result, re.DOTALL)
+            if details_match:
+                verification_details = details_match.group(1).strip()
+                if verification_details:
+                    issues_found = True
+                    if verbose:
+                        rprint(f"\n[yellow]Found {verification_issues_count} potential issues. Proceeding to fix step.[/yellow]")
+                else:
+                    # Count > 0, but details empty -> Warning
+                    rprint("[yellow]Warning:[/yellow] <issues_count> is > 0, but <details> tag is empty. Treating as no issues found.")
+                    verification_issues_count = 0  # Reset count
+            else:
+                # Count > 0, but no details tag -> Warning
+                rprint("[yellow]Warning:[/yellow] <issues_count> is > 0, but could not find <details> tag. Treating as no issues found.")
+                verification_issues_count = 0  # Reset count
+        else:
+            # verification_issues_count is 0 (either parsed as 0 or defaulted after warning)
+            if verbose:
+                rprint("\n[green]No issues found during verification.[/green]")
+
+    # Removed ValueError catch as it's handled by the logic above
+    except Exception as e:
+        # Generic catch for other potential parsing issues
+        rprint(f"[bold red]Error parsing verification result:[/bold red] {e}")
+        return {
+            "explanation": None,
+            "fixed_program": program,
+            "fixed_code": code,
+            "total_cost": total_cost,
+            "model_name": model_name,
+            "verification_issues_count": 0,  # Reset count on parsing error
+        }
+
+    if issues_found and verification_details:
+        if verbose:
+            rprint(f"\n[blue]Step 5: Running fix generation (Strength: {strength}, Temp: {temperature})...[/blue]")
+
+        fix_input_json = {
+            "program": program,
+            "prompt": prompt,
+            "code": code,
+            "output": output,
+            "issues": verification_details,
+        }
+
+        try:
+            fix_response = llm_invoke(
+                prompt=fix_errors_prompt_template,
+                input_json=fix_input_json,
+                strength=strength,
+                temperature=temperature,
+                verbose=False,  # Keep internal llm_invoke verbose off unless needed
+            )
+            total_cost += fix_response.get('cost', 0.0)
+            model_name = fix_response.get('model_name', model_name)  # Update model name to the last one used
+            fix_result = fix_response.get('result', '')
+
+            if verbose:
+                rprint(f"[cyan]Fix LLM call complete.[/cyan]")
+                rprint(f" [dim]Model Used:[/dim] {fix_response.get('model_name', 'N/A')}")
+                rprint(f" [dim]Cost:[/dim] ${fix_response.get('cost', 0.0):.6f}")
+                rprint("\n[blue]Fix Result:[/blue]")
+                # Markdown object handles its own rendering, no extra needed here
+                rprint(Markdown(fix_result))
+
+            fixed_program_match = re.search(r"<fixed_program>(.*?)</fixed_program>", fix_result, re.DOTALL)
+            fixed_code_match = re.search(r"<fixed_code>(.*?)</fixed_code>", fix_result, re.DOTALL)
+            explanation_match = re.search(r"<explanation>(.*?)</explanation>", fix_result, re.DOTALL)
+
+            if fixed_program_match:
+                fixed_program = fixed_program_match.group(1).strip()
+                if verbose: rprint("[green]Extracted fixed program.[/green]")
+            else:
+                if verbose: rprint("[yellow]Warning:[/yellow] Could not find <fixed_program> tag in fix result. Using original program.")
+
+            if fixed_code_match:
+                fixed_code = fixed_code_match.group(1).strip()
+                if verbose: rprint("[green]Extracted fixed code module.[/green]")
+            else:
+                if verbose: rprint("[yellow]Warning:[/yellow] Could not find <fixed_code> tag in fix result. Using original code module.")
+
+            if explanation_match:
+                fix_explanation = explanation_match.group(1).strip()
+                if verbose: rprint("[green]Extracted fix explanation.[/green]")
+            else:
+                if verbose: rprint("[yellow]Warning:[/yellow] Could not find <explanation> tag in fix result.")
+                fix_explanation = "[Fix explanation not provided by LLM]"
+
+        except Exception as e:
+            rprint(f"[bold red]Error during fix LLM call or extraction:[/bold red] {e}")
+            # Combine verification details with the error message if fix failed
+            final_explanation = f"<error>Error during fix generation: {str(e)}</error>\n"
+            if verification_details:
+                fix_explanation = f"[Error during fix generation: {e}]"
+            # Note: verification_issues_count should retain its value from the verification step
+
+    if verbose:
+        rprint(f"\n[bold blue]Total Cost for fix_verification_errors run:[/bold blue] ${total_cost:.6f}")
+
+    # Construct final explanation only if issues were initially found and processed
+    if verification_details:
+        if fix_explanation:
+            final_explanation = (
+                f"<verification_details>{verification_details}</verification_details>\n"
+                f"<fix_explanation>{fix_explanation}</fix_explanation>"
+            )
+        else:
+            # This case might occur if fix step wasn't run due to parsing issues after verification,
+            # or if fix_explanation extraction failed silently (though we added a default).
+            # Let's ensure we always provide some context if details were found.
+            final_explanation = (
+                f"<verification_details>{verification_details}</verification_details>\n"
+                f"<fix_explanation>[Fix explanation not available or fix step skipped]</fix_explanation>"
+            )
+    # If no issues were found initially (verification_details is None), final_explanation remains None
+
+    return {
+        "explanation": final_explanation,
+        "fixed_program": fixed_program,
+        "fixed_code": fixed_code,
+        "total_cost": total_cost,
+        "model_name": model_name,
+        "verification_issues_count": verification_issues_count,
+    }
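
A hedged usage sketch of the new module, showing how the returned dictionary is meant to be consumed. The input strings below are hypothetical stand-ins; only fix_verification_errors, its signature, and the result keys come from the diff above:

from pdd.fix_verification_errors import fix_verification_errors

# Hypothetical inputs; the CLI would read these from real files.
result = fix_verification_errors(
    program="import calc\nprint(calc.add(2, 2))",  # program that exercised the module
    prompt="Write an add(a, b) function.",         # prompt that generated the module
    code="def add(a, b):\n    return a - b\n",     # code module under verification
    output="Expected 4, got 0",                    # output logs from the verification run
    strength=0.5,                                  # 0-1 model-selection strength
    verbose=True,
)

if result["verification_issues_count"] > 0:
    print(result["explanation"])  # <verification_details>...</verification_details> plus fix explanation
    print(result["fixed_code"])   # potentially corrected module source
print(f"Cost: ${result['total_cost']:.6f} (model: {result['model_name']})")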