pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl
This diff compares two publicly released versions of this package as they appear in their respective public registries. It is provided for informational purposes only.
- pdd/__init__.py +40 -8
- pdd/agentic_bug.py +323 -0
- pdd/agentic_bug_orchestrator.py +497 -0
- pdd/agentic_change.py +231 -0
- pdd/agentic_change_orchestrator.py +526 -0
- pdd/agentic_common.py +598 -0
- pdd/agentic_crash.py +534 -0
- pdd/agentic_e2e_fix.py +319 -0
- pdd/agentic_e2e_fix_orchestrator.py +426 -0
- pdd/agentic_fix.py +1294 -0
- pdd/agentic_langtest.py +162 -0
- pdd/agentic_update.py +387 -0
- pdd/agentic_verify.py +183 -0
- pdd/architecture_sync.py +565 -0
- pdd/auth_service.py +210 -0
- pdd/auto_deps_main.py +71 -51
- pdd/auto_include.py +245 -5
- pdd/auto_update.py +125 -47
- pdd/bug_main.py +196 -23
- pdd/bug_to_unit_test.py +2 -0
- pdd/change_main.py +11 -4
- pdd/cli.py +22 -1181
- pdd/cmd_test_main.py +350 -150
- pdd/code_generator.py +60 -18
- pdd/code_generator_main.py +790 -57
- pdd/commands/__init__.py +48 -0
- pdd/commands/analysis.py +306 -0
- pdd/commands/auth.py +309 -0
- pdd/commands/connect.py +290 -0
- pdd/commands/fix.py +163 -0
- pdd/commands/generate.py +257 -0
- pdd/commands/maintenance.py +175 -0
- pdd/commands/misc.py +87 -0
- pdd/commands/modify.py +256 -0
- pdd/commands/report.py +144 -0
- pdd/commands/sessions.py +284 -0
- pdd/commands/templates.py +215 -0
- pdd/commands/utility.py +110 -0
- pdd/config_resolution.py +58 -0
- pdd/conflicts_main.py +8 -3
- pdd/construct_paths.py +589 -111
- pdd/context_generator.py +10 -2
- pdd/context_generator_main.py +175 -76
- pdd/continue_generation.py +53 -10
- pdd/core/__init__.py +33 -0
- pdd/core/cli.py +527 -0
- pdd/core/cloud.py +237 -0
- pdd/core/dump.py +554 -0
- pdd/core/errors.py +67 -0
- pdd/core/remote_session.py +61 -0
- pdd/core/utils.py +90 -0
- pdd/crash_main.py +262 -33
- pdd/data/language_format.csv +71 -63
- pdd/data/llm_model.csv +20 -18
- pdd/detect_change_main.py +5 -4
- pdd/docs/prompting_guide.md +864 -0
- pdd/docs/whitepaper_with_benchmarks/data_and_functions/benchmark_analysis.py +495 -0
- pdd/docs/whitepaper_with_benchmarks/data_and_functions/creation_compare.py +528 -0
- pdd/fix_code_loop.py +523 -95
- pdd/fix_code_module_errors.py +6 -2
- pdd/fix_error_loop.py +491 -92
- pdd/fix_errors_from_unit_tests.py +4 -3
- pdd/fix_main.py +278 -21
- pdd/fix_verification_errors.py +12 -100
- pdd/fix_verification_errors_loop.py +529 -286
- pdd/fix_verification_main.py +294 -89
- pdd/frontend/dist/assets/index-B5DZHykP.css +1 -0
- pdd/frontend/dist/assets/index-DQ3wkeQ2.js +449 -0
- pdd/frontend/dist/index.html +376 -0
- pdd/frontend/dist/logo.svg +33 -0
- pdd/generate_output_paths.py +139 -15
- pdd/generate_test.py +218 -146
- pdd/get_comment.py +19 -44
- pdd/get_extension.py +8 -9
- pdd/get_jwt_token.py +318 -22
- pdd/get_language.py +8 -7
- pdd/get_run_command.py +75 -0
- pdd/get_test_command.py +68 -0
- pdd/git_update.py +70 -19
- pdd/incremental_code_generator.py +2 -2
- pdd/insert_includes.py +13 -4
- pdd/llm_invoke.py +1711 -181
- pdd/load_prompt_template.py +19 -12
- pdd/path_resolution.py +140 -0
- pdd/pdd_completion.fish +25 -2
- pdd/pdd_completion.sh +30 -4
- pdd/pdd_completion.zsh +79 -4
- pdd/postprocess.py +14 -4
- pdd/preprocess.py +293 -24
- pdd/preprocess_main.py +41 -6
- pdd/prompts/agentic_bug_step10_pr_LLM.prompt +182 -0
- pdd/prompts/agentic_bug_step1_duplicate_LLM.prompt +73 -0
- pdd/prompts/agentic_bug_step2_docs_LLM.prompt +129 -0
- pdd/prompts/agentic_bug_step3_triage_LLM.prompt +95 -0
- pdd/prompts/agentic_bug_step4_reproduce_LLM.prompt +97 -0
- pdd/prompts/agentic_bug_step5_root_cause_LLM.prompt +123 -0
- pdd/prompts/agentic_bug_step6_test_plan_LLM.prompt +107 -0
- pdd/prompts/agentic_bug_step7_generate_LLM.prompt +172 -0
- pdd/prompts/agentic_bug_step8_verify_LLM.prompt +119 -0
- pdd/prompts/agentic_bug_step9_e2e_test_LLM.prompt +289 -0
- pdd/prompts/agentic_change_step10_identify_issues_LLM.prompt +1006 -0
- pdd/prompts/agentic_change_step11_fix_issues_LLM.prompt +984 -0
- pdd/prompts/agentic_change_step12_create_pr_LLM.prompt +131 -0
- pdd/prompts/agentic_change_step1_duplicate_LLM.prompt +73 -0
- pdd/prompts/agentic_change_step2_docs_LLM.prompt +101 -0
- pdd/prompts/agentic_change_step3_research_LLM.prompt +126 -0
- pdd/prompts/agentic_change_step4_clarify_LLM.prompt +164 -0
- pdd/prompts/agentic_change_step5_docs_change_LLM.prompt +981 -0
- pdd/prompts/agentic_change_step6_devunits_LLM.prompt +1005 -0
- pdd/prompts/agentic_change_step7_architecture_LLM.prompt +1044 -0
- pdd/prompts/agentic_change_step8_analyze_LLM.prompt +1027 -0
- pdd/prompts/agentic_change_step9_implement_LLM.prompt +1077 -0
- pdd/prompts/agentic_crash_explore_LLM.prompt +49 -0
- pdd/prompts/agentic_e2e_fix_step1_unit_tests_LLM.prompt +90 -0
- pdd/prompts/agentic_e2e_fix_step2_e2e_tests_LLM.prompt +91 -0
- pdd/prompts/agentic_e2e_fix_step3_root_cause_LLM.prompt +89 -0
- pdd/prompts/agentic_e2e_fix_step4_fix_e2e_tests_LLM.prompt +96 -0
- pdd/prompts/agentic_e2e_fix_step5_identify_devunits_LLM.prompt +91 -0
- pdd/prompts/agentic_e2e_fix_step6_create_unit_tests_LLM.prompt +106 -0
- pdd/prompts/agentic_e2e_fix_step7_verify_tests_LLM.prompt +116 -0
- pdd/prompts/agentic_e2e_fix_step8_run_pdd_fix_LLM.prompt +120 -0
- pdd/prompts/agentic_e2e_fix_step9_verify_all_LLM.prompt +146 -0
- pdd/prompts/agentic_fix_explore_LLM.prompt +45 -0
- pdd/prompts/agentic_fix_harvest_only_LLM.prompt +48 -0
- pdd/prompts/agentic_fix_primary_LLM.prompt +85 -0
- pdd/prompts/agentic_update_LLM.prompt +925 -0
- pdd/prompts/agentic_verify_explore_LLM.prompt +45 -0
- pdd/prompts/auto_include_LLM.prompt +122 -905
- pdd/prompts/change_LLM.prompt +3093 -1
- pdd/prompts/detect_change_LLM.prompt +686 -27
- pdd/prompts/example_generator_LLM.prompt +22 -1
- pdd/prompts/extract_code_LLM.prompt +5 -1
- pdd/prompts/extract_program_code_fix_LLM.prompt +7 -1
- pdd/prompts/extract_prompt_update_LLM.prompt +7 -8
- pdd/prompts/extract_promptline_LLM.prompt +17 -11
- pdd/prompts/find_verification_errors_LLM.prompt +6 -0
- pdd/prompts/fix_code_module_errors_LLM.prompt +12 -2
- pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +9 -0
- pdd/prompts/fix_verification_errors_LLM.prompt +22 -0
- pdd/prompts/generate_test_LLM.prompt +41 -7
- pdd/prompts/generate_test_from_example_LLM.prompt +115 -0
- pdd/prompts/increase_tests_LLM.prompt +1 -5
- pdd/prompts/insert_includes_LLM.prompt +316 -186
- pdd/prompts/prompt_code_diff_LLM.prompt +119 -0
- pdd/prompts/prompt_diff_LLM.prompt +82 -0
- pdd/prompts/trace_LLM.prompt +25 -22
- pdd/prompts/unfinished_prompt_LLM.prompt +85 -1
- pdd/prompts/update_prompt_LLM.prompt +22 -1
- pdd/pytest_output.py +127 -12
- pdd/remote_session.py +876 -0
- pdd/render_mermaid.py +236 -0
- pdd/server/__init__.py +52 -0
- pdd/server/app.py +335 -0
- pdd/server/click_executor.py +587 -0
- pdd/server/executor.py +338 -0
- pdd/server/jobs.py +661 -0
- pdd/server/models.py +241 -0
- pdd/server/routes/__init__.py +31 -0
- pdd/server/routes/architecture.py +451 -0
- pdd/server/routes/auth.py +364 -0
- pdd/server/routes/commands.py +929 -0
- pdd/server/routes/config.py +42 -0
- pdd/server/routes/files.py +603 -0
- pdd/server/routes/prompts.py +1322 -0
- pdd/server/routes/websocket.py +473 -0
- pdd/server/security.py +243 -0
- pdd/server/terminal_spawner.py +209 -0
- pdd/server/token_counter.py +222 -0
- pdd/setup_tool.py +648 -0
- pdd/simple_math.py +2 -0
- pdd/split_main.py +3 -2
- pdd/summarize_directory.py +237 -195
- pdd/sync_animation.py +8 -4
- pdd/sync_determine_operation.py +839 -112
- pdd/sync_main.py +351 -57
- pdd/sync_orchestration.py +1400 -756
- pdd/sync_tui.py +848 -0
- pdd/template_expander.py +161 -0
- pdd/template_registry.py +264 -0
- pdd/templates/architecture/architecture_json.prompt +237 -0
- pdd/templates/generic/generate_prompt.prompt +174 -0
- pdd/trace.py +168 -12
- pdd/trace_main.py +4 -3
- pdd/track_cost.py +140 -63
- pdd/unfinished_prompt.py +51 -4
- pdd/update_main.py +567 -67
- pdd/update_model_costs.py +2 -2
- pdd/update_prompt.py +19 -4
- {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/METADATA +29 -11
- pdd_cli-0.0.118.dist-info/RECORD +227 -0
- {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/licenses/LICENSE +1 -1
- pdd_cli-0.0.45.dist-info/RECORD +0 -116
- {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/WHEEL +0 -0
- {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/entry_points.txt +0 -0
- {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/top_level.txt +0 -0
pdd/fix_error_loop.py
CHANGED

```diff
@@ -5,14 +5,25 @@ import subprocess
 import shutil
 import json
 from datetime import datetime
+from pathlib import Path
+from typing import Tuple, Optional
 
+import requests
 from rich import print as rprint
 from rich.console import Console
+from rich.panel import Panel
 
 # Relative import from an internal module.
+from .get_language import get_language
 from .fix_errors_from_unit_tests import fix_errors_from_unit_tests
-from . import DEFAULT_TIME
+from . import DEFAULT_TIME  # Import DEFAULT_TIME
 from .python_env_detector import detect_host_python_executable
+from .agentic_fix import run_agentic_fix
+from .agentic_langtest import default_verify_cmd_for
+from .core.cloud import CloudConfig
+
+# Cloud request timeout for LLM calls
+CLOUD_FIX_TIMEOUT = 400  # seconds
 
 console = Console()
 
@@ -20,44 +31,190 @@ def escape_brackets(text: str) -> str:
     """Escape square brackets so Rich doesn't misinterpret them."""
     return text.replace("[", "\\[").replace("]", "\\]")
 
-
+
+def cloud_fix_errors(
+    unit_test: str,
+    code: str,
+    prompt: str,
+    error: str,
+    error_file: str,
+    strength: float,
+    temperature: float,
+    verbose: bool = False,
+    time: float = DEFAULT_TIME,
+    code_file_ext: str = ".py"
+) -> Tuple[bool, bool, str, str, str, float, str]:
     """
-
-
+    Call the cloud fixCode endpoint to fix errors in code and unit tests.
+
+    This function has the same interface as fix_errors_from_unit_tests to allow
+    seamless switching between local and cloud execution in the fix loop.
+
+    Args:
+        unit_test: Unit test code string
+        code: Source code string
+        prompt: Prompt that generated the code
+        error: Error messages/logs from test failures
+        error_file: Path to write error analysis (not used in cloud, but kept for interface compatibility)
+        strength: Model strength parameter [0,1]
+        temperature: Model temperature parameter [0,1]
+        verbose: Enable verbose logging
+        time: Time budget for thinking effort
+        code_file_ext: File extension to determine language (e.g., ".py", ".java")
+
+    Returns:
+        Tuple of:
+        - update_unit_test: Whether unit test was updated
+        - update_code: Whether code was updated
+        - fixed_unit_test: Fixed unit test code
+        - fixed_code: Fixed source code
+        - analysis: Analysis/explanation of fixes
+        - total_cost: Cost of the operation
+        - model_name: Name of model used
+
+    Raises:
+        RuntimeError: When cloud execution fails with non-recoverable error
     """
+    jwt_token = CloudConfig.get_jwt_token(verbose=verbose)
+
+    if not jwt_token:
+        raise RuntimeError("Cloud authentication failed - no JWT token available")
+
+    # Build cloud payload
+    payload = {
+        "unitTest": unit_test,
+        "code": code,
+        "prompt": prompt,
+        "errors": error,
+        "language": get_language(code_file_ext),
+        "strength": strength,
+        "temperature": temperature,
+        "time": time if time is not None else 0.25,
+        "verbose": verbose,
+    }
+
+    headers = {
+        "Authorization": f"Bearer {jwt_token}",
+        "Content-Type": "application/json"
+    }
+    cloud_url = CloudConfig.get_endpoint_url("fixCode")
+
+    if verbose:
+        console.print(Panel(f"Calling cloud fix at {cloud_url}", title="[blue]Cloud LLM[/blue]", expand=False))
+
     try:
-
-
-
-
-
-
-
-        try:
-            output = json.loads(result.stdout)
-            test_results = output.get('test_results', [{}])[0]
-
-            # Check pytest's return code first
-            return_code = test_results.get('return_code', 1)
-
-            failures = test_results.get('failures', 0)
-            errors = test_results.get('errors', 0)
-            warnings = test_results.get('warnings', 0)
+        response = requests.post(
+            cloud_url,
+            json=payload,
+            headers=headers,
+            timeout=CLOUD_FIX_TIMEOUT
+        )
+        response.raise_for_status()
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+        response_data = response.json()
+        fixed_unit_test = response_data.get("fixedUnitTest", "")
+        fixed_code = response_data.get("fixedCode", "")
+        analysis = response_data.get("analysis", "")
+        total_cost = float(response_data.get("totalCost", 0.0))
+        model_name = response_data.get("modelName", "cloud_model")
+        update_unit_test = response_data.get("updateUnitTest", False)
+        update_code = response_data.get("updateCode", False)
+
+        if verbose:
+            console.print(f"[cyan]Cloud fix completed. Model: {model_name}, Cost: ${total_cost:.6f}[/cyan]")
+
+        return update_unit_test, update_code, fixed_unit_test, fixed_code, analysis, total_cost, model_name
+
+    except requests.exceptions.Timeout:
+        raise RuntimeError(f"Cloud fix timed out after {CLOUD_FIX_TIMEOUT}s")
+
+    except requests.exceptions.HTTPError as e:
+        status_code = e.response.status_code if e.response else 0
+        err_content = e.response.text[:200] if e.response else "No response content"
+
+        # Non-recoverable errors
+        if status_code == 402:
+            try:
+                error_data = e.response.json()
+                current_balance = error_data.get("currentBalance", "unknown")
+                estimated_cost = error_data.get("estimatedCost", "unknown")
+                raise RuntimeError(f"Insufficient credits. Balance: {current_balance}, estimated cost: {estimated_cost}")
+            except json.JSONDecodeError:
+                raise RuntimeError(f"Insufficient credits: {err_content}")
+        elif status_code == 401:
+            raise RuntimeError(f"Authentication failed: {err_content}")
+        elif status_code == 403:
+            raise RuntimeError(f"Access denied: {err_content}")
+        elif status_code == 400:
+            raise RuntimeError(f"Invalid request: {err_content}")
+        else:
+            # 5xx or other errors - raise for caller to handle
+            raise RuntimeError(f"Cloud HTTP error ({status_code}): {err_content}")
+
+    except requests.exceptions.RequestException as e:
+        raise RuntimeError(f"Cloud network error: {e}")
+
+    except json.JSONDecodeError:
+        raise RuntimeError("Cloud returned invalid JSON response")
+
+
+# ---------- Normalize any agentic return shape to a 4-tuple ----------
+def _normalize_agentic_result(result):
+    """
+    Normalize run_agentic_fix result into: (success: bool, msg: str, cost: float, model: str, changed_files: List[str])
+    Handles older 2/3/4-tuple shapes used by tests/monkeypatches.
+    """
+    if isinstance(result, tuple):
+        if len(result) == 5:
+            ok, msg, cost, model, changed_files = result
+            return bool(ok), str(msg), float(cost), str(model or "agentic-cli"), list(changed_files or [])
+        if len(result) == 4:
+            ok, msg, cost, model = result
+            return bool(ok), str(msg), float(cost), str(model or "agentic-cli"), []
+        if len(result) == 3:
+            ok, msg, cost = result
+            return bool(ok), str(msg), float(cost), "agentic-cli", []
+        if len(result) == 2:
+            ok, msg = result
+            return bool(ok), str(msg), 0.0, "agentic-cli", []
+    # Fallback (shouldn't happen)
+    return False, "Invalid agentic result shape", 0.0, "agentic-cli", []
+
+def _safe_run_agentic_fix(*, prompt_file, code_file, unit_test_file, error_log_file, cwd=None):
+    """
+    Call (possibly monkeypatched) run_agentic_fix and normalize its return.
+    """
+    res = run_agentic_fix(
+        prompt_file=prompt_file,
+        code_file=code_file,
+        unit_test_file=unit_test_file,
+        error_log_file=error_log_file,
+        cwd=cwd,
+    )
+    return _normalize_agentic_result(res)
+# ---------------------------------------------------------------------
+
+
+def run_pytest_on_file(test_file: str) -> tuple[int, int, int, str]:
+    """
+    Run pytest on the specified test file using the subprocess-based runner.
+    Returns a tuple: (failures, errors, warnings, logs)
+    """
+    from .pytest_output import run_pytest_and_capture_output
+    # Use the subprocess-based runner to avoid module caching issues
+    output_data = run_pytest_and_capture_output(test_file)
+
+    # Extract results
+    results = output_data.get("test_results", [{}])[0]
+
+    failures = results.get("failures", 0)
+    errors = results.get("errors", 0)
+    warnings = results.get("warnings", 0)
+
+    # Combine stdout/stderr for the log
+    logs = (results.get("standard_output", "") or "") + "\n" + (results.get("standard_error", "") or "")
+
+    return failures, errors, warnings, logs
 
 def format_log_for_output(log_structure):
     """
```
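The `_normalize_agentic_result` helper added above widens the accepted return shapes of `run_agentic_fix` so that older 2/3/4-tuple results from tests and monkeypatches still work. A minimal sketch of that contract, assuming pdd-cli 0.0.118 is installed; the tuples below are made-up stand-ins for agent results, not real outputs:

```python
# Sketch of the _normalize_agentic_result contract (pdd-cli 0.0.118 assumed installed).
from pdd.fix_error_loop import _normalize_agentic_result

# A legacy 2-tuple (ok, msg) gains default cost, model, and changed-files fields.
assert _normalize_agentic_result((True, "fixed")) == (True, "fixed", 0.0, "agentic-cli", [])

# A modern 5-tuple passes through with types coerced to bool/str/float/list.
ok, msg, cost, model, files = _normalize_agentic_result((1, "done", "0.02", None, ("a.py",)))
assert (ok, cost, model, files) == (True, 0.02, "agentic-cli", ["a.py"])
```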
```diff
@@ -77,6 +234,8 @@ def format_log_for_output(log_structure):
         # Fix attempt with XML tags
         if iteration.get("fix_attempt"):
             formatted_text += f"<fix_attempt iteration={iteration['number']}>\n"
+            if iteration.get("model_name"):
+                formatted_text += f"Model: {iteration['model_name']}\n"
             formatted_text += f"{iteration['fix_attempt']}\n"
             formatted_text += "</fix_attempt>\n\n"
 
@@ -101,6 +260,7 @@ def format_log_for_output(log_structure):
 
 def fix_error_loop(unit_test_file: str,
                    code_file: str,
+                   prompt_file: str,
                    prompt: str,
                    verification_program: str,
                    strength: float,
@@ -109,15 +269,22 @@ def fix_error_loop(unit_test_file: str,
                    budget: float,
                    error_log_file: str = "error_log.txt",
                    verbose: bool = False,
-                   time: float = DEFAULT_TIME):
+                   time: float = DEFAULT_TIME,
+                   agentic_fallback: bool = True,
+                   use_cloud: bool = False):
     """
-    Attempt to fix errors in a unit test and corresponding code using repeated iterations,
-    counting only the number of times we actually call the LLM fix function.
+    Attempt to fix errors in a unit test and corresponding code using repeated iterations,
+    counting only the number of times we actually call the LLM fix function.
     The tests are re-run in the same iteration after a fix to see if we've succeeded,
     so that 'attempts' matches the number of fix attempts (not the total test runs).
 
     This updated version uses structured logging to avoid redundant entries.
 
+    Hybrid Cloud Support:
+    When use_cloud=True, the LLM fix calls are routed to the cloud fixCode endpoint
+    while local test execution (pytest, verification programs) stays local. This allows
+    the loop to pass local test results to the cloud for analysis and fixes.
+
     Inputs:
         unit_test_file: Path to the file containing unit tests.
         code_file: Path to the file containing the code under test.
@@ -130,7 +297,8 @@ def fix_error_loop(unit_test_file: str,
         error_log_file: Path to file to log errors (default: "error_log.txt").
         verbose: Enable verbose logging (default: False).
         time: Time parameter for the fix_errors_from_unit_tests call.
-
+        agentic_fallback: Whether to trigger cli agentic fallback when fix fails.
+        use_cloud: If True, use cloud LLM for fix calls while keeping test execution local.
     Outputs:
         success: Boolean indicating if the overall process succeeded.
         final_unit_test: String contents of the final unit test file.
@@ -185,9 +353,63 @@ def fix_error_loop(unit_test_file: str,
 
     # We do up to max_attempts fix attempts or until budget is exceeded
    iteration = 0
+    # Determine if target is Python (moved before try block for use in exception handler)
+    is_python = str(code_file).lower().endswith(".py")
    # Run an initial test to determine starting state
    try:
-
+        if is_python:
+            initial_fails, initial_errors, initial_warnings, pytest_output = run_pytest_on_file(unit_test_file)
+        else:
+            # For non-Python files, run the verification program to get an initial error state
+            rprint(f"[cyan]Non-Python target detected. Running verification program to get initial state...[/cyan]")
+            lang = get_language(os.path.splitext(code_file)[1])
+            verify_cmd = default_verify_cmd_for(lang, unit_test_file)
+            if not verify_cmd:
+                # No verify command available (e.g., Java without maven/gradle).
+                # Trigger agentic fallback directly.
+                rprint(f"[cyan]No verification command for {lang}. Triggering agentic fallback directly...[/cyan]")
+                error_log_path = Path(error_log_file)
+                error_log_path.parent.mkdir(parents=True, exist_ok=True)
+                if not error_log_path.exists() or error_log_path.stat().st_size == 0:
+                    with open(error_log_path, "w") as f:
+                        f.write(f"No verification command available for language: {lang}\n")
+                        f.write("Agentic fix will attempt to resolve the issue.\n")
+
+                rprint(f"[cyan]Attempting agentic fix fallback (prompt_file={prompt_file!r})...[/cyan]")
+                success, agent_msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_fix(
+                    prompt_file=prompt_file,
+                    code_file=code_file,
+                    unit_test_file=unit_test_file,
+                    error_log_file=error_log_file,
+                    cwd=None,  # Use project root (cwd), not prompt file's parent
+                )
+                if not success:
+                    rprint(f"[bold red]Agentic fix fallback failed: {agent_msg}[/bold red]")
+                if agent_changed_files:
+                    rprint(f"[cyan]Agent modified {len(agent_changed_files)} file(s):[/cyan]")
+                    for f in agent_changed_files:
+                        rprint(f"  • {f}")
+                final_unit_test = ""
+                final_code = ""
+                try:
+                    with open(unit_test_file, "r") as f:
+                        final_unit_test = f.read()
+                except Exception:
+                    pass
+                try:
+                    with open(code_file, "r") as f:
+                        final_code = f.read()
+                except Exception:
+                    pass
+                return success, final_unit_test, final_code, 1, agent_cost, agent_model
+
+            verify_result = subprocess.run(verify_cmd, capture_output=True, text=True, shell=True, stdin=subprocess.DEVNULL)
+            pytest_output = (verify_result.stdout or "") + "\n" + (verify_result.stderr or "")
+            if verify_result.returncode == 0:
+                initial_fails, initial_errors, initial_warnings = 0, 0, 0
+            else:
+                initial_fails, initial_errors, initial_warnings = 1, 0, 0  # Treat any failure as one "fail"
+
        # Store initial state for statistics
        stats = {
            "initial_fails": initial_fails,
@@ -200,14 +422,98 @@ def fix_error_loop(unit_test_file: str,
            "iterations_info": []
        }
    except Exception as e:
-        rprint(f"[red]Error running initial
-
+        rprint(f"[red]Error running initial test/verification:[/red] {e}")
+        # Instead of returning early, trigger agentic fallback if enabled (Issue #266)
+        if agentic_fallback:
+            rprint("[cyan]Initial test failed with exception. Triggering agentic fallback...[/cyan]")
+            error_log_path = Path(error_log_file)
+            error_log_path.parent.mkdir(parents=True, exist_ok=True)
+            with open(error_log_path, "w") as f:
+                f.write(f"Initial test/verification failed with exception:\n{e}\n")
+
+            success, agent_msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_fix(
+                prompt_file=prompt_file,
+                code_file=code_file,
+                unit_test_file=unit_test_file,
+                error_log_file=error_log_file,
+                cwd=None,
+            )
+            if not success:
+                rprint(f"[bold red]Agentic fix fallback failed: {agent_msg}[/bold red]")
+            if agent_changed_files:
+                rprint(f"[cyan]Agent modified {len(agent_changed_files)} file(s):[/cyan]")
+                for f in agent_changed_files:
+                    rprint(f"  • {f}")
+            final_unit_test = ""
+            final_code = ""
+            try:
+                with open(unit_test_file, "r") as f:
+                    final_unit_test = f.read()
+            except Exception:
+                pass
+            try:
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception:
+                pass
+            return success, final_unit_test, final_code, 1, agent_cost, agent_model
+        else:
+            # Agentic fallback disabled, return failure
+            return False, "", "", fix_attempts, total_cost, model_name
+
+    # If target is not a Python file, trigger agentic fallback if tests fail
+    if not is_python:
+        if initial_fails > 0 or initial_errors > 0:
+            rprint("[cyan]Non-Python target failed initial verification. Triggering agentic fallback...[/cyan]")
+            error_log_path = Path(error_log_file)
+            error_log_path.parent.mkdir(parents=True, exist_ok=True)
+            with open(error_log_path, "w") as f:
+                f.write(pytest_output)
+
+            rprint(f"[cyan]Attempting agentic fix fallback (prompt_file={prompt_file!r})...[/cyan]")
+            success, agent_msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_fix(
+                prompt_file=prompt_file,
+                code_file=code_file,
+                unit_test_file=unit_test_file,
+                error_log_file=error_log_file,
+                cwd=None,  # Use project root (cwd), not prompt file's parent
+            )
+            if not success:
+                rprint(f"[bold red]Agentic fix fallback failed: {agent_msg}[/bold red]")
+            if agent_changed_files:
+                rprint(f"[cyan]Agent modified {len(agent_changed_files)} file(s):[/cyan]")
+                for f in agent_changed_files:
+                    rprint(f"  • {f}")
+            final_unit_test = ""
+            final_code = ""
+            try:
+                with open(unit_test_file, "r") as f:
+                    final_unit_test = f.read()
+            except Exception:
+                pass
+            try:
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception:
+                pass
+            return success, final_unit_test, final_code, 1, agent_cost, agent_model
+        else:
+            # Non-python tests passed, so we are successful.
+            rprint("[green]Non-Python tests passed. No fix needed.[/green]")
+            try:
+                with open(unit_test_file, "r") as f:
+                    final_unit_test = f.read()
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception as e:
+                rprint(f"[yellow]Warning: Could not read final files: {e}[/yellow]")
+            return True, final_unit_test, final_code, 0, 0.0, "N/A"
 
    fails, errors, warnings = initial_fails, initial_errors, initial_warnings
 
    # Determine success state immediately
    success = (fails == 0 and errors == 0 and warnings == 0)
-
+
    # Track if tests were initially passing
    initially_passing = success
 
@@ -244,13 +550,23 @@ def fix_error_loop(unit_test_file: str,
 
            # Update structured log
            log_structure["iterations"][-1]["post_test_output"] = pytest_output
-
+
            # Write formatted log to file
-
+            error_log_path = Path(error_log_file)
+            error_log_path.parent.mkdir(parents=True, exist_ok=True)
+            with open(error_log_path, "w") as elog:
                elog.write(format_log_for_output(log_structure))
 
            # Set success to True (already determined)
-            #
+            # Read the actual fixed files to return the successful state
+            try:
+                with open(unit_test_file, "r") as f:
+                    final_unit_test = f.read()
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception as e:
+                rprint(f"[yellow]Warning: Could not read fixed files: {e}[/yellow]")
+                # Keep empty strings as fallback
            break
 
        iteration_header = f"=== Attempt iteration {iteration} ==="
@@ -280,17 +596,18 @@ def fix_error_loop(unit_test_file: str,
            break
 
        # We only attempt to fix if test is failing or has warnings:
-        # Let's create backups
-
-
-
-
-
-
-
-
-        )
+        # Let's create backups in .pdd/backups/ to avoid polluting code/test directories
+        code_name = os.path.basename(code_file)
+        code_basename = os.path.splitext(code_name)[0]
+        unit_test_name = os.path.basename(unit_test_file)
+        unit_test_ext = os.path.splitext(unit_test_name)[1]
+        code_ext = os.path.splitext(code_name)[1]
+
+        backup_dir = Path.cwd() / '.pdd' / 'backups' / code_basename / timestamp
+        backup_dir.mkdir(parents=True, exist_ok=True)
+
+        unit_test_backup = str(backup_dir / f"test_{iteration}_{errors}_{fails}_{warnings}{unit_test_ext}")
+        code_backup = str(backup_dir / f"code_{iteration}_{errors}_{fails}_{warnings}{code_ext}")
        try:
            shutil.copy(unit_test_file, unit_test_backup)
            shutil.copy(code_file, code_backup)
@@ -299,7 +616,8 @@ def fix_error_loop(unit_test_file: str,
            rprint(f"[green]Created backup for code file:[/green] {code_backup}")
        except Exception as e:
            rprint(f"[red]Error creating backup files:[/red] {e}")
-
+            success = False
+            break  # Exit loop but continue to agentic fallback (Issue #266)
 
        # Update best iteration if needed:
        if (errors < best_iteration_info["errors"] or
@@ -322,29 +640,67 @@ def fix_error_loop(unit_test_file: str,
                code_contents = f.read()
        except Exception as e:
            rprint(f"[red]Error reading input files:[/red] {e}")
-
+            success = False
+            break  # Exit loop but continue to agentic fallback (Issue #266)
 
-        # Call fix:
+        # Call fix (cloud or local based on use_cloud parameter):
        try:
-            # Format the log for the LLM
+            # Format the log for the LLM - includes local test results
            formatted_log = format_log_for_output(log_structure)
-
-
-
-
-
-
-
-
-
-
-
-
-
+
+            if use_cloud:
+                # Use cloud LLM for fix - local test results passed via formatted_log
+                try:
+                    updated_unit_test, updated_code, fixed_unit_test, fixed_code, analysis, cost, model_name = cloud_fix_errors(
+                        unit_test=unit_test_contents,
+                        code=code_contents,
+                        prompt=prompt,
+                        error=formatted_log,  # Pass local test results to cloud
+                        error_file=error_log_file,
+                        strength=strength,
+                        temperature=temperature,
+                        verbose=verbose,
+                        time=time,
+                        code_file_ext=os.path.splitext(code_file)[1]
+                    )
+                except RuntimeError as cloud_err:
+                    # Cloud failed - fall back to local if it's a recoverable error
+                    if "Insufficient credits" in str(cloud_err) or "Authentication failed" in str(cloud_err) or "Access denied" in str(cloud_err):
+                        # Non-recoverable errors - stop the loop
+                        rprint(f"[red]Cloud fix error (non-recoverable):[/red] {cloud_err}")
+                        break
+                    # Recoverable errors - fall back to local
+                    rprint(f"[yellow]Cloud fix failed, falling back to local:[/yellow] {cloud_err}")
+                    updated_unit_test, updated_code, fixed_unit_test, fixed_code, analysis, cost, model_name = fix_errors_from_unit_tests(
+                        unit_test_contents,
+                        code_contents,
+                        prompt,
+                        formatted_log,
+                        error_log_file,
+                        strength,
+                        temperature,
+                        verbose=verbose,
+                        time=time
+                    )
+            else:
+                # Use local LLM for fix
+                updated_unit_test, updated_code, fixed_unit_test, fixed_code, analysis, cost, model_name = fix_errors_from_unit_tests(
+                    unit_test_contents,
+                    code_contents,
+                    prompt,
+                    formatted_log,  # Use formatted log instead of reading the file
+                    error_log_file,
+                    strength,
+                    temperature,
+                    verbose=verbose,
+                    time=time  # Pass time parameter
+                )
+
            # Update the fix attempt in the structured log
            log_structure["iterations"][-1]["fix_attempt"] = analysis
+            log_structure["iterations"][-1]["model_name"] = model_name
        except Exception as e:
-            rprint(f"[red]Error during
+            rprint(f"[red]Error during fix call:[/red] {e}")
            break
 
        fix_attempts += 1  # We used one fix attempt
```
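The `use_cloud` branch in the hunk above is a cloud-first call with a local fallback, keyed off the error message: credit, auth, and access errors abort the loop, while anything else (timeouts, network errors, 5xx) falls back to the local fixer. A self-contained sketch of that control flow; `remote_fix` and `local_fix` are illustrative stand-ins, not part of the pdd API:

```python
# Distilled sketch of the cloud-first/local-fallback pattern used above.
# remote_fix and local_fix are hypothetical stand-ins, not pdd functions.
NON_RECOVERABLE = ("Insufficient credits", "Authentication failed", "Access denied")

def remote_fix() -> str:
    raise RuntimeError("Cloud network error: connection reset")  # recoverable

def local_fix() -> str:
    return "fixed locally"

def fix_with_fallback() -> str:
    try:
        return remote_fix()
    except RuntimeError as err:
        if any(marker in str(err) for marker in NON_RECOVERABLE):
            raise  # non-recoverable: surface the error instead of retrying
        return local_fix()  # recoverable: fall back to the local path

print(fix_with_fallback())  # -> "fixed locally"
```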
```diff
@@ -384,7 +740,7 @@ def fix_error_loop(unit_test_file: str,
        # Run the verification:
        try:
            verify_cmd = [detect_host_python_executable(), verification_program]
-            verify_result = subprocess.run(verify_cmd, capture_output=True, text=True)
+            verify_result = subprocess.run(verify_cmd, capture_output=True, text=True, stdin=subprocess.DEVNULL)
            # Safely handle None for stdout or stderr:
            verify_stdout = verify_result.stdout or ""
            verify_stderr = verify_result.stderr or ""
@@ -414,9 +770,11 @@ def fix_error_loop(unit_test_file: str,
 
        # Update post-test output in structured log
        log_structure["iterations"][-1]["post_test_output"] = pytest_output
-
+
        # Write updated structured log to file after each iteration
-
+        error_log_path = Path(error_log_file)
+        error_log_path.parent.mkdir(parents=True, exist_ok=True)
+        with open(error_log_path, "w") as elog:
            elog.write(format_log_for_output(log_structure))
 
        # Update iteration stats with post-fix results
@@ -438,7 +796,8 @@ def fix_error_loop(unit_test_file: str,
            stats["final_warnings"] = warnings
        except Exception as e:
            rprint(f"[red]Error running pytest for next iteration:[/red] {e}")
-
+            success = False
+            break  # Exit loop but continue to agentic fallback (Issue #266)
 
    # Possibly restore best iteration if the final run is not as good:
    if best_iteration_info["attempt"] is not None and not success:
@@ -480,8 +839,8 @@ def fix_error_loop(unit_test_file: str,
    else:
        stats["best_iteration"] = "final"
 
-    # Read final file contents
-    #
+    # Read final file contents for non-initially-passing tests
+    # (Initially passing tests have files read at lines 344-348)
    try:
        if not initially_passing:
            with open(unit_test_file, "r") as f:
@@ -492,11 +851,6 @@ def fix_error_loop(unit_test_file: str,
        rprint(f"[red]Error reading final files:[/red] {e}")
        final_unit_test, final_code = "", ""
 
-    # Check if we broke out early because tests already passed
-    if stats["best_iteration"] == 0 and fix_attempts == 0:
-        # Still return at least 1 attempt to acknowledge the work done
-        fix_attempts = 1
-
    # Print summary statistics
    rprint("\n[bold cyan]Summary Statistics:[/bold cyan]")
    rprint(f"Initial state: {initial_fails} fails, {initial_errors} errors, {initial_warnings} warnings")
@@ -506,17 +860,62 @@ def fix_error_loop(unit_test_file: str,
 
    # Calculate improvements
    stats["improvement"] = {
-        "fails_reduced": initial_fails - stats[
-        "errors_reduced": initial_errors - stats[
-        "warnings_reduced": initial_warnings - stats[
-        "percent_improvement": 100 if initial_fails + initial_errors + initial_warnings == 0 else
-            (1 - (stats[
+        "fails_reduced": initial_fails - stats['final_fails'],
+        "errors_reduced": initial_errors - stats['final_errors'],
+        "warnings_reduced": initial_warnings - stats['final_warnings'],
+        "percent_improvement": 100 if (initial_fails + initial_errors + initial_warnings) == 0 else
+            (1 - (stats['final_fails'] + stats['final_errors'] + stats['final_warnings']) /
            (initial_fails + initial_errors + initial_warnings)) * 100
    }
 
    rprint(f"Improvement: {stats['improvement']['fails_reduced']} fails, {stats['improvement']['errors_reduced']} errors, {stats['improvement']['warnings_reduced']} warnings")
    rprint(f"Overall improvement: {stats['improvement']['percent_improvement']:.2f}%")
 
+    # Agentic fallback at end adds cost & model (normalized)
+    if not success and agentic_fallback and total_cost < budget:
+        # Ensure error_log_file exists before calling agentic fix
+        # Write the current log structure if it hasn't been written yet
+        try:
+            if not os.path.exists(error_log_file) or os.path.getsize(error_log_file) == 0:
+                error_log_path = Path(error_log_file)
+                error_log_path.parent.mkdir(parents=True, exist_ok=True)
+                with open(error_log_path, "w") as elog:
+                    if log_structure["iterations"]:
+                        elog.write(format_log_for_output(log_structure))
+                    else:
+                        # No iterations ran, write initial state info
+                        elog.write(f"Initial state: {initial_fails} fails, {initial_errors} errors, {initial_warnings} warnings\n")
+                        if 'pytest_output' in locals():
+                            elog.write(f"\n<pytest_output>\n{pytest_output}\n</pytest_output>\n")
+        except Exception as e:
+            rprint(f"[yellow]Warning: Could not write error log before agentic fallback: {e}[/yellow]")
+
+        rprint(f"[cyan]Attempting agentic fix fallback (prompt_file={prompt_file!r})...[/cyan]")
+        agent_success, agent_msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_fix(
+            prompt_file=prompt_file,
+            code_file=code_file,
+            unit_test_file=unit_test_file,
+            error_log_file=error_log_file,
+            cwd=None,  # Use project root (cwd), not prompt file's parent
+        )
+        total_cost += agent_cost
+        if not agent_success:
+            rprint(f"[bold red]Agentic fix fallback failed: {agent_msg}[/bold red]")
+        if agent_changed_files:
+            rprint(f"[cyan]Agent modified {len(agent_changed_files)} file(s):[/cyan]")
+            for f in agent_changed_files:
+                rprint(f"  • {f}")
+        if agent_success:
+            model_name = agent_model or model_name
+            try:
+                with open(unit_test_file, "r") as f:
+                    final_unit_test = f.read()
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception as e:
+                rprint(f"[yellow]Warning: Could not read files after successful agentic fix: {e}[/yellow]")
+            success = True
+
    return success, final_unit_test, final_code, fix_attempts, total_cost, model_name
 
 # If this module is run directly for testing purposes:
@@ -551,4 +950,4 @@ if __name__ == "__main__":
    rprint(f"Attempts: {attempts}")
    rprint(f"Total cost: ${total_cost:.6f}")
    rprint(f"Model used: {model_name}")
-    rprint(f"Final unit test contents:\n{final_unit_test}")
+    rprint(f"Final unit test contents:\n{final_unit_test}")
```
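For orientation, the new `run_pytest_on_file` helper added in this version returns the `(failures, errors, warnings, logs)` tuple the loop uses, and the loop counts a run as successful only when all three counters are zero. A minimal driver, assuming pdd-cli 0.0.118 is installed; `tests/test_example.py` is a placeholder path, not a file shipped with the package:

```python
# Minimal driver for run_pytest_on_file (pdd-cli 0.0.118 assumed installed).
# "tests/test_example.py" is a placeholder test file path.
from pdd.fix_error_loop import run_pytest_on_file

failures, errors, warnings, logs = run_pytest_on_file("tests/test_example.py")

# The fix loop above treats a run as successful only when all counters are zero.
success = (failures == 0 and errors == 0 and warnings == 0)
print(f"success={success}\n{logs}")
```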