PyPI - pdd-cli - Versions diffs - 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl - Mend

pdd-cli 0.0.45 (py3-none-any.whl) → 0.0.118 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195) hide show

pdd/__init__.py +40 -8
pdd/agentic_bug.py +323 -0
pdd/agentic_bug_orchestrator.py +497 -0
pdd/agentic_change.py +231 -0
pdd/agentic_change_orchestrator.py +526 -0
pdd/agentic_common.py +598 -0
pdd/agentic_crash.py +534 -0
pdd/agentic_e2e_fix.py +319 -0
pdd/agentic_e2e_fix_orchestrator.py +426 -0
pdd/agentic_fix.py +1294 -0
pdd/agentic_langtest.py +162 -0
pdd/agentic_update.py +387 -0
pdd/agentic_verify.py +183 -0
pdd/architecture_sync.py +565 -0
pdd/auth_service.py +210 -0
pdd/auto_deps_main.py +71 -51
pdd/auto_include.py +245 -5
pdd/auto_update.py +125 -47
pdd/bug_main.py +196 -23
pdd/bug_to_unit_test.py +2 -0
pdd/change_main.py +11 -4
pdd/cli.py +22 -1181
pdd/cmd_test_main.py +350 -150
pdd/code_generator.py +60 -18
pdd/code_generator_main.py +790 -57
pdd/commands/__init__.py +48 -0
pdd/commands/analysis.py +306 -0
pdd/commands/auth.py +309 -0
pdd/commands/connect.py +290 -0
pdd/commands/fix.py +163 -0
pdd/commands/generate.py +257 -0
pdd/commands/maintenance.py +175 -0
pdd/commands/misc.py +87 -0
pdd/commands/modify.py +256 -0
pdd/commands/report.py +144 -0
pdd/commands/sessions.py +284 -0
pdd/commands/templates.py +215 -0
pdd/commands/utility.py +110 -0
pdd/config_resolution.py +58 -0
pdd/conflicts_main.py +8 -3
pdd/construct_paths.py +589 -111
pdd/context_generator.py +10 -2
pdd/context_generator_main.py +175 -76
pdd/continue_generation.py +53 -10
pdd/core/__init__.py +33 -0
pdd/core/cli.py +527 -0
pdd/core/cloud.py +237 -0
pdd/core/dump.py +554 -0
pdd/core/errors.py +67 -0
pdd/core/remote_session.py +61 -0
pdd/core/utils.py +90 -0
pdd/crash_main.py +262 -33
pdd/data/language_format.csv +71 -63
pdd/data/llm_model.csv +20 -18
pdd/detect_change_main.py +5 -4
pdd/docs/prompting_guide.md +864 -0
pdd/docs/whitepaper_with_benchmarks/data_and_functions/benchmark_analysis.py +495 -0
pdd/docs/whitepaper_with_benchmarks/data_and_functions/creation_compare.py +528 -0
pdd/fix_code_loop.py +523 -95
pdd/fix_code_module_errors.py +6 -2
pdd/fix_error_loop.py +491 -92
pdd/fix_errors_from_unit_tests.py +4 -3
pdd/fix_main.py +278 -21
pdd/fix_verification_errors.py +12 -100
pdd/fix_verification_errors_loop.py +529 -286
pdd/fix_verification_main.py +294 -89
pdd/frontend/dist/assets/index-B5DZHykP.css +1 -0
pdd/frontend/dist/assets/index-DQ3wkeQ2.js +449 -0
pdd/frontend/dist/index.html +376 -0
pdd/frontend/dist/logo.svg +33 -0
pdd/generate_output_paths.py +139 -15
pdd/generate_test.py +218 -146
pdd/get_comment.py +19 -44
pdd/get_extension.py +8 -9
pdd/get_jwt_token.py +318 -22
pdd/get_language.py +8 -7
pdd/get_run_command.py +75 -0
pdd/get_test_command.py +68 -0
pdd/git_update.py +70 -19
pdd/incremental_code_generator.py +2 -2
pdd/insert_includes.py +13 -4
pdd/llm_invoke.py +1711 -181
pdd/load_prompt_template.py +19 -12
pdd/path_resolution.py +140 -0
pdd/pdd_completion.fish +25 -2
pdd/pdd_completion.sh +30 -4
pdd/pdd_completion.zsh +79 -4
pdd/postprocess.py +14 -4
pdd/preprocess.py +293 -24
pdd/preprocess_main.py +41 -6
pdd/prompts/agentic_bug_step10_pr_LLM.prompt +182 -0
pdd/prompts/agentic_bug_step1_duplicate_LLM.prompt +73 -0
pdd/prompts/agentic_bug_step2_docs_LLM.prompt +129 -0
pdd/prompts/agentic_bug_step3_triage_LLM.prompt +95 -0
pdd/prompts/agentic_bug_step4_reproduce_LLM.prompt +97 -0
pdd/prompts/agentic_bug_step5_root_cause_LLM.prompt +123 -0
pdd/prompts/agentic_bug_step6_test_plan_LLM.prompt +107 -0
pdd/prompts/agentic_bug_step7_generate_LLM.prompt +172 -0
pdd/prompts/agentic_bug_step8_verify_LLM.prompt +119 -0
pdd/prompts/agentic_bug_step9_e2e_test_LLM.prompt +289 -0
pdd/prompts/agentic_change_step10_identify_issues_LLM.prompt +1006 -0
pdd/prompts/agentic_change_step11_fix_issues_LLM.prompt +984 -0
pdd/prompts/agentic_change_step12_create_pr_LLM.prompt +131 -0
pdd/prompts/agentic_change_step1_duplicate_LLM.prompt +73 -0
pdd/prompts/agentic_change_step2_docs_LLM.prompt +101 -0
pdd/prompts/agentic_change_step3_research_LLM.prompt +126 -0
pdd/prompts/agentic_change_step4_clarify_LLM.prompt +164 -0
pdd/prompts/agentic_change_step5_docs_change_LLM.prompt +981 -0
pdd/prompts/agentic_change_step6_devunits_LLM.prompt +1005 -0
pdd/prompts/agentic_change_step7_architecture_LLM.prompt +1044 -0
pdd/prompts/agentic_change_step8_analyze_LLM.prompt +1027 -0
pdd/prompts/agentic_change_step9_implement_LLM.prompt +1077 -0
pdd/prompts/agentic_crash_explore_LLM.prompt +49 -0
pdd/prompts/agentic_e2e_fix_step1_unit_tests_LLM.prompt +90 -0
pdd/prompts/agentic_e2e_fix_step2_e2e_tests_LLM.prompt +91 -0
pdd/prompts/agentic_e2e_fix_step3_root_cause_LLM.prompt +89 -0
pdd/prompts/agentic_e2e_fix_step4_fix_e2e_tests_LLM.prompt +96 -0
pdd/prompts/agentic_e2e_fix_step5_identify_devunits_LLM.prompt +91 -0
pdd/prompts/agentic_e2e_fix_step6_create_unit_tests_LLM.prompt +106 -0
pdd/prompts/agentic_e2e_fix_step7_verify_tests_LLM.prompt +116 -0
pdd/prompts/agentic_e2e_fix_step8_run_pdd_fix_LLM.prompt +120 -0
pdd/prompts/agentic_e2e_fix_step9_verify_all_LLM.prompt +146 -0
pdd/prompts/agentic_fix_explore_LLM.prompt +45 -0
pdd/prompts/agentic_fix_harvest_only_LLM.prompt +48 -0
pdd/prompts/agentic_fix_primary_LLM.prompt +85 -0
pdd/prompts/agentic_update_LLM.prompt +925 -0
pdd/prompts/agentic_verify_explore_LLM.prompt +45 -0
pdd/prompts/auto_include_LLM.prompt +122 -905
pdd/prompts/change_LLM.prompt +3093 -1
pdd/prompts/detect_change_LLM.prompt +686 -27
pdd/prompts/example_generator_LLM.prompt +22 -1
pdd/prompts/extract_code_LLM.prompt +5 -1
pdd/prompts/extract_program_code_fix_LLM.prompt +7 -1
pdd/prompts/extract_prompt_update_LLM.prompt +7 -8
pdd/prompts/extract_promptline_LLM.prompt +17 -11
pdd/prompts/find_verification_errors_LLM.prompt +6 -0
pdd/prompts/fix_code_module_errors_LLM.prompt +12 -2
pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +9 -0
pdd/prompts/fix_verification_errors_LLM.prompt +22 -0
pdd/prompts/generate_test_LLM.prompt +41 -7
pdd/prompts/generate_test_from_example_LLM.prompt +115 -0
pdd/prompts/increase_tests_LLM.prompt +1 -5
pdd/prompts/insert_includes_LLM.prompt +316 -186
pdd/prompts/prompt_code_diff_LLM.prompt +119 -0
pdd/prompts/prompt_diff_LLM.prompt +82 -0
pdd/prompts/trace_LLM.prompt +25 -22
pdd/prompts/unfinished_prompt_LLM.prompt +85 -1
pdd/prompts/update_prompt_LLM.prompt +22 -1
pdd/pytest_output.py +127 -12
pdd/remote_session.py +876 -0
pdd/render_mermaid.py +236 -0
pdd/server/__init__.py +52 -0
pdd/server/app.py +335 -0
pdd/server/click_executor.py +587 -0
pdd/server/executor.py +338 -0
pdd/server/jobs.py +661 -0
pdd/server/models.py +241 -0
pdd/server/routes/__init__.py +31 -0
pdd/server/routes/architecture.py +451 -0
pdd/server/routes/auth.py +364 -0
pdd/server/routes/commands.py +929 -0
pdd/server/routes/config.py +42 -0
pdd/server/routes/files.py +603 -0
pdd/server/routes/prompts.py +1322 -0
pdd/server/routes/websocket.py +473 -0
pdd/server/security.py +243 -0
pdd/server/terminal_spawner.py +209 -0
pdd/server/token_counter.py +222 -0
pdd/setup_tool.py +648 -0
pdd/simple_math.py +2 -0
pdd/split_main.py +3 -2
pdd/summarize_directory.py +237 -195
pdd/sync_animation.py +8 -4
pdd/sync_determine_operation.py +839 -112
pdd/sync_main.py +351 -57
pdd/sync_orchestration.py +1400 -756
pdd/sync_tui.py +848 -0
pdd/template_expander.py +161 -0
pdd/template_registry.py +264 -0
pdd/templates/architecture/architecture_json.prompt +237 -0
pdd/templates/generic/generate_prompt.prompt +174 -0
pdd/trace.py +168 -12
pdd/trace_main.py +4 -3
pdd/track_cost.py +140 -63
pdd/unfinished_prompt.py +51 -4
pdd/update_main.py +567 -67
pdd/update_model_costs.py +2 -2
pdd/update_prompt.py +19 -4
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/METADATA +29 -11
pdd_cli-0.0.118.dist-info/RECORD +227 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/licenses/LICENSE +1 -1
pdd_cli-0.0.45.dist-info/RECORD +0 -116
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/WHEEL +0 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/entry_points.txt +0 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/top_level.txt +0 -0

pdd/fix_code_loop.py CHANGED Viewed

@@ -1,30 +1,289 @@
+from __future__ import annotations
+import json
 import os
 import shutil
 import subprocess
 import sys
+import threading
 from pathlib import Path
-from typing import Tuple, Optional, Union
-from . import DEFAULT_TIME # Added DEFAULT_TIME
+from typing import Tuple, Optional, Union, List
+import requests
+# Try to import DEFAULT_TIME, with fallback
+try:
+    from . import DEFAULT_TIME
+except ImportError:
+    DEFAULT_TIME = 0.5
+# Try to import agentic modules, with fallbacks
+try:
+    from .agentic_crash import run_agentic_crash
+except ImportError:
+    def run_agentic_crash(**kwargs):
+        return (False, "Agentic crash handler not available", 0.0, "N/A", [])
+try:
+    from .get_language import get_language
+except ImportError:
+    def get_language(ext):
+        return "unknown"
+try:
+    from .agentic_langtest import default_verify_cmd_for
+except ImportError:
+    def default_verify_cmd_for(lang, verification_program):
+        return None
+def _normalize_agentic_result(result):
+    """
+    Coerce whatever run_agentic_crash returned into the canonical 5-tuple
+    (success: bool, msg: str, cost: float, model: str, changed_files: List[str]).
+    Legacy 2-, 3- and 4-element tuples (still produced by tests/monkeypatches) are
+    accepted; their missing trailing fields take the defaults 0.0, "agentic-cli" and [].
+    Any other value is reported as a failed result instead of raising.
+    """
+    if isinstance(result, tuple) and 2 <= len(result) <= 5:
+        # Pad the tail so every accepted shape unpacks the same way:
+        # cost -> 0.0, model -> None (becomes "agentic-cli"), changed_files -> None (becomes []).
+        missing_tail = (0.0, None, None)[len(result) - 2:]
+        ok, msg, cost, model, changed_files = result + missing_tail
+        return bool(ok), str(msg), float(cost), str(model or "agentic-cli"), list(changed_files or [])
+    # Non-tuple input, or a tuple of unexpected length (shouldn't happen)
+    return False, "Invalid agentic result shape", 0.0, "agentic-cli", []
+def _safe_run_agentic_crash(*, prompt_file, code_file, program_file, crash_log_file, cwd=None):
+    """
+    Invoke (possibly monkeypatched) run_agentic_crash and return its result normalized
+    to (success, msg, cost, model, changed_files).
+    The four file arguments are converted to Path objects before the call, and the
+    handler is always run with verbose=True, quiet=False.
+    Note: cwd is accepted for signature compatibility only and is never forwarded;
+    run_agentic_crash is expected to derive its working directory from prompt_file.parent.
+    An empty prompt_file, or any exception raised while calling the handler, produces a
+    failure tuple instead of propagating.
+    """
+    if not prompt_file:
+        return False, "Agentic fix requires a valid prompt file.", 0.0, "agentic-cli", []
+    try:
+        outcome = run_agentic_crash(
+            prompt_file=Path(prompt_file),
+            code_file=Path(code_file),
+            program_file=Path(program_file),
+            crash_log_file=Path(crash_log_file),
+            verbose=True,
+            quiet=False,
+        )
+        return _normalize_agentic_result(outcome)
+    except Exception as exc:
+        return False, f"Agentic crash handler failed: {exc}", 0.0, "agentic-cli", []
 # Use Rich for pretty printing to the console
-from rich.console import Console
-# Initialize Rich Console
-console = Console(record=True)
-rprint = console.print
+try:
+    from rich.console import Console
+    console = Console(record=True)
+    rprint = console.print
+except ImportError:
+    # Fallback if Rich is not available
+    def rprint(*args, **kwargs):
+        print(*args)
+# Cloud configuration
+try:
+    from .core.cloud import CloudConfig
+    CLOUD_AVAILABLE = True
+except ImportError:
+    CLOUD_AVAILABLE = False
+    CloudConfig = None
+# Cloud request timeout for crash fix
+CLOUD_REQUEST_TIMEOUT = 400  # seconds
+def cloud_crash_fix(
+    program: str,
+    prompt: str,
+    code: str,
+    errors: str,
+    strength: float,
+    temperature: float,
+    time: float,
+    verbose: bool,
+    program_path: str = "",
+    code_path: str = "",
+    language: str = "python",
+) -> Tuple[bool, bool, str, str, str, float, Optional[str]]:
+    """
+    Ask the cloud crashCode endpoint for an LLM-generated crash fix.
+    The request is authenticated with a JWT obtained from CloudConfig and is bounded by
+    CLOUD_REQUEST_TIMEOUT. A `time` of None is sent as 0.25.
+    Returns:
+        Tuple of (update_program, update_code, fixed_program, fixed_code, analysis, cost, model_name).
+        Fields missing from the response fall back to False / "" / 0.0 / "cloud_model".
+    Raises:
+        RuntimeError: If cloud support is unavailable or no JWT token could be obtained.
+        Whatever requests raises for transport failures, and response.raise_for_status()
+        raises for HTTP error statuses, is propagated unchanged.
+    """
+    if not (CLOUD_AVAILABLE and CloudConfig is not None):
+        raise RuntimeError("Cloud configuration not available")
+    jwt_token = CloudConfig.get_jwt_token(verbose=verbose)
+    if not jwt_token:
+        raise RuntimeError("Cloud authentication failed - no JWT token")
+    effective_time = 0.25 if time is None else time
+    payload = {
+        "programContent": program,
+        "promptContent": prompt,
+        "codeContent": code,
+        "errorContent": errors,
+        "language": language,
+        "strength": strength,
+        "temperature": temperature,
+        "time": effective_time,
+        "verbose": verbose,
+        "programPath": program_path,
+        "codePath": code_path,
+    }
+    headers = {
+        "Authorization": f"Bearer {jwt_token}",
+        "Content-Type": "application/json"
+    }
+    response = requests.post(
+        CloudConfig.get_endpoint_url("crashCode"),
+        json=payload,
+        headers=headers,
+        timeout=CLOUD_REQUEST_TIMEOUT
+    )
+    response.raise_for_status()
+    data = response.json()
+    # Return order differs from the response's field order: program fields come first.
+    return (
+        data.get("updateProgram", False),
+        data.get("updateCode", False),
+        data.get("fixedProgram", ""),
+        data.get("fixedCode", ""),
+        data.get("analysis", ""),
+        float(data.get("totalCost", 0.0)),
+        data.get("modelName", "cloud_model"),
+    )
 # Use relative import for internal modules
 try:
-    # Attempt relative import for package context
     from .fix_code_module_errors import fix_code_module_errors
 except ImportError:
-    # Fallback for script execution context (e.g., testing)
-    # This assumes fix_code_module_errors.py is in the same directory or Python path
-    # You might need to adjust this based on your project structure during testing
-    print("Warning: Relative import failed. Attempting direct import for fix_code_module_errors.", file=sys.stderr)
-    # Add parent directory to sys.path if necessary for testing outside a package
-    # import sys
-    # sys.path.append(str(Path(__file__).parent.parent)) # Adjust based on structure
-    from fix_code_module_errors import fix_code_module_errors
+    try:
+        from fix_code_module_errors import fix_code_module_errors
+    except ImportError:
+        # Provide a stub that will fail gracefully
+        def fix_code_module_errors(**kwargs):
+            return (False, False, "", "", "Module not available", 0.0, None)
+class ProcessResult:
+    """Minimal holder for a finished process's return code and captured stdout/stderr."""
+    def __init__(self, returncode, stdout, stderr):
+        # Attribute names mirror the ones read off the verification result in fix_code_loop.
+        self.returncode, self.stdout, self.stderr = returncode, stdout, stderr
+def run_process_with_output(cmd_args, timeout=300):
+    """
+    Runs a process to completion (or timeout) while capturing its stdout and stderr.
+    The child receives no stdin (it is connected to DEVNULL) and its output is captured
+    only; nothing is echoed to the console.
+    Uses start_new_session=True to create a new process group, allowing us to
+    kill all child processes if the main process times out.
+    Args:
+        cmd_args: Argument list handed to subprocess.Popen.
+        timeout: Seconds to wait for the process before killing it (default: 300).
+    Returns:
+        Tuple of (returncode, stdout, stderr). Output is decoded as UTF-8 with invalid
+        bytes replaced. returncode is -1 if the process could not be started (stderr
+        then holds the exception text) or if no exit status is available. On timeout
+        the marker "[Timeout]" is appended to stderr.
+    """
+    import signal
+    try:
+        proc = subprocess.Popen(
+            cmd_args,
+            stdin=subprocess.DEVNULL,
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE,
+            bufsize=0,
+            start_new_session=True  # Create new process group for clean termination
+        )
+    except Exception as e:
+        return -1, "", str(e)
+    captured_stdout = []
+    captured_stderr = []
+    READ_CHUNK_SIZE = 4096
+    def drain_pipe(pipe, capture_list):
+        # The pipes are unbuffered (bufsize=0), so read(n) returns as soon as any data is
+        # available. Requesting a chunk avoids one system call per byte of output.
+        while True:
+            try:
+                chunk = pipe.read(READ_CHUNK_SIZE)
+                if not chunk:
+                    break
+                capture_list.append(chunk)
+            except (ValueError, IOError, OSError):
+                # OSError can occur when pipe is closed during read
+                break
+    t_out = threading.Thread(target=drain_pipe, args=(proc.stdout, captured_stdout), daemon=True)
+    t_err = threading.Thread(target=drain_pipe, args=(proc.stderr, captured_stderr), daemon=True)
+    t_out.start()
+    t_err.start()
+    timed_out = False
+    try:
+        proc.wait(timeout=timeout)
+    except subprocess.TimeoutExpired:
+        timed_out = True
+        captured_stderr.append(b"\n[Timeout]\n")
+    # Kill process and entire process group if needed
+    if timed_out or proc.returncode is None:
+        try:
+            # Kill entire process group to handle forked children
+            os.killpg(os.getpgid(proc.pid), signal.SIGKILL)
+        except (AttributeError, ProcessLookupError, OSError):
+            # AttributeError: killpg/getpgid/SIGKILL are unavailable on Windows; fall
+            # through to proc.kill(). Otherwise the process group may already be dead.
+            pass
+        try:
+            proc.kill()
+            proc.wait(timeout=5)
+        except Exception:
+            # Best effort: the process may have exited between the checks above.
+            pass
+    # Wait for threads to finish reading with timeout
+    # For normal completion, threads will exit when they read EOF from the pipe
+    # For timeout/kill cases, we may need to close pipes to unblock them
+    THREAD_JOIN_TIMEOUT = 5  # seconds - enough time to drain normal output buffers
+    t_out.join(timeout=THREAD_JOIN_TIMEOUT)
+    t_err.join(timeout=THREAD_JOIN_TIMEOUT)
+    # If threads are still alive after first timeout, close pipes to unblock them
+    # This handles cases where child processes keep pipes open
+    if t_out.is_alive() or t_err.is_alive():
+        for pipe in (proc.stdout, proc.stderr):
+            try:
+                pipe.close()
+            except Exception:
+                pass
+        # Give threads a bit more time after closing pipes
+        t_out.join(timeout=2)
+        t_err.join(timeout=2)
+    # If threads are still alive after all attempts, log it
+    if t_out.is_alive() or t_err.is_alive():
+        captured_stderr.append(b"\n[Thread join timeout - some output may be lost]\n")
+    stdout_str = b"".join(captured_stdout).decode('utf-8', errors='replace')
+    stderr_str = b"".join(captured_stderr).decode('utf-8', errors='replace')
+    return proc.returncode if proc.returncode is not None else -1, stdout_str, stderr_str
 def fix_code_loop(
@@ -38,10 +297,18 @@ def fix_code_loop(
     error_log_file: str,
     verbose: bool = False,
     time: float = DEFAULT_TIME,
+    prompt_file: str = "",
+    agentic_fallback: bool = True,
+    use_cloud: bool = False,
 ) -> Tuple[bool, str, str, int, float, Optional[str]]:
     """
     Attempts to fix errors in a code module through multiple iterations.
+    Hybrid Cloud Support:
+        When use_cloud=True, the LLM fix calls are routed to the cloud crashCode endpoint
+        while local verification program execution stays local. This allows the loop to
+        pass local verification results to the cloud for analysis and fixes.
     Args:
         code_file: Path to the code file being tested.
         prompt: The prompt that generated the code under test.
@@ -53,6 +320,9 @@ def fix_code_loop(
         error_log_file: Path to the error log file.
         verbose: Enable detailed logging (default: False).
         time: Time limit for the LLM calls (default: DEFAULT_TIME).
+        prompt_file: Path to the prompt file.
+        agentic_fallback: Enable agentic fallback if the primary fix mechanism fails.
+        use_cloud: If True, use cloud LLM for fix calls while keeping verification execution local.
     Returns:
         Tuple containing the following in order:
@@ -63,15 +333,98 @@ def fix_code_loop(
         - total_cost (float): Total cost of all fix attempts.
         - model_name (str | None): Name of the LLM model used (or None if no LLM calls were made).
     """
-    # --- Start: Modified File Checks ---
+    # Handle default time if passed as None (though signature defaults to DEFAULT_TIME)
+    if time is None:
+        time = DEFAULT_TIME
+    # --- Start: File Checks ---
     if not Path(code_file).is_file():
-        # Raising error for code file is acceptable as it's fundamental
         raise FileNotFoundError(f"Code file not found: {code_file}")
     if not Path(verification_program).is_file():
-        # Handle missing verification program gracefully as per test expectation
         rprint(f"[bold red]Error: Verification program not found: {verification_program}[/bold red]")
         return False, "", "", 0, 0.0, None
-    # --- End: Modified File Checks ---
+    # --- End: File Checks ---
+    is_python = str(code_file).lower().endswith(".py")
+    if not is_python:
+        # For non-Python files, run the verification program to get an initial error state
+        rprint(f"[cyan]Non-Python target detected. Running verification program to get initial state...[/cyan]")
+        lang = get_language(os.path.splitext(code_file)[1])
+        verify_cmd = default_verify_cmd_for(lang, verification_program)
+        if not verify_cmd:
+            # No verify command available (e.g., Java without maven/gradle).
+            # Trigger agentic fallback directly using any existing error log.
+            rprint(f"[cyan]No verification command for {lang}. Triggering agentic fallback directly...[/cyan]")
+            error_log_path = Path(error_log_file)
+            error_log_path.parent.mkdir(parents=True, exist_ok=True)
+            # Read existing error content or create minimal log
+            if not error_log_path.exists() or error_log_path.stat().st_size == 0:
+                with open(error_log_path, "w") as f:
+                    f.write(f"No verification command available for language: {lang}\n")
+                    f.write("Agentic fix will attempt to resolve the issue.\n")
+            success, _msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_crash(
+                prompt_file=prompt_file,
+                code_file=code_file,
+                program_file=verification_program,
+                crash_log_file=error_log_file,
+                cwd=Path(prompt_file).parent if prompt_file else None
+            )
+            final_program = ""
+            final_code = ""
+            try:
+                with open(verification_program, "r") as f:
+                    final_program = f.read()
+            except Exception:
+                pass
+            try:
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception:
+                pass
+            return success, final_program, final_code, 1, agent_cost, agent_model
+        verify_result = subprocess.run(verify_cmd, capture_output=True, text=True, shell=True)
+        pytest_output = (verify_result.stdout or "") + "\n" + (verify_result.stderr or "")
+        if verify_result.returncode != 0:
+            rprint("[cyan]Non-Python target failed initial verification. Triggering agentic fallback...[/cyan]")
+            error_log_path = Path(error_log_file)
+            error_log_path.parent.mkdir(parents=True, exist_ok=True)
+            with open(error_log_path, "w") as f:
+                f.write(pytest_output)
+            success, _msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_crash(
+                prompt_file=prompt_file,
+                code_file=code_file,
+                program_file=verification_program,
+                crash_log_file=error_log_file,
+                cwd=Path(prompt_file).parent if prompt_file else None
+            )
+            final_program = ""
+            final_code = ""
+            try:
+                with open(verification_program, "r") as f:
+                    final_program = f.read()
+            except Exception:
+                pass
+            try:
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception:
+                pass
+            return success, final_program, final_code, 1, agent_cost, agent_model
+        else:
+            rprint("[green]Non-Python tests passed. No fix needed.[/green]")
+            try:
+                final_program = ""
+                final_code = ""
+                with open(verification_program, "r") as f:
+                    final_program = f.read()
+                with open(code_file, "r") as f:
+                    final_code = f.read()
+            except Exception as e:
+                rprint(f"[yellow]Warning: Could not read final files: {e}[/yellow]")
+            return True, final_program, final_code, 0, 0.0, "N/A"
     # Step 1: Remove existing error log file
     try:
@@ -83,20 +436,26 @@ def fix_code_loop(
             rprint(f"Error log file not found, no need to remove: {error_log_file}")
     except OSError as e:
         rprint(f"[bold red]Error removing log file {error_log_file}: {e}[/bold red]")
-        # Decide if this is fatal or not; for now, we continue
     # Step 2: Initialize variables
     attempts = 0
     total_cost = 0.0
     success = False
     model_name = None
-    history_log = "<history>\n" # Initialize history log XML root
+    history_log = "<history>\n"
     # Create initial backups before any modifications
+    # Store in .pdd/backups/ to avoid polluting code/test directories
+    from datetime import datetime
+    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
     code_file_path = Path(code_file)
     verification_program_path = Path(verification_program)
-    original_code_backup = f"{code_file_path.stem}_original_backup{code_file_path.suffix}"
-    original_program_backup = f"{verification_program_path.stem}_original_backup{verification_program_path.suffix}"
+    backup_dir = Path.cwd() / '.pdd' / 'backups' / code_file_path.stem / timestamp
+    backup_dir.mkdir(parents=True, exist_ok=True)
+    original_code_backup = str(backup_dir / f"code_original{code_file_path.suffix}")
+    original_program_backup = str(backup_dir / f"program_original{verification_program_path.suffix}")
     try:
         shutil.copy2(code_file, original_code_backup)
@@ -105,33 +464,41 @@ def fix_code_loop(
             rprint(f"Created initial backups: {original_code_backup}, {original_program_backup}")
     except Exception as e:
         rprint(f"[bold red]Error creating initial backups: {e}[/bold red]")
-        # If backups fail, we cannot guarantee restoration. Return failure.
         return False, "", "", 0, 0.0, None
+    # Initialize process for scope
+    process = None
     # Step 3: Enter the fixing loop
     while attempts < max_attempts and total_cost <= budget:
-        current_attempt = attempts + 1 # User-facing attempt number (starts at 1)
-        rprint(f"\n[bold cyan]Attempt {current_attempt}/{max_attempts}...[/bold cyan]")
-        attempt_log_entry = f'  <attempt number="{current_attempt}">\n' # Start XML for this attempt
+        # current_attempt is used for logging the current iteration number
+        current_iteration_number = attempts + 1
+        rprint(f"\n[bold cyan]Attempt {current_iteration_number}/{max_attempts}...[/bold cyan]")
+        attempt_log_entry = f'  <attempt number="{current_iteration_number}">\n'
         # b. Run the verification program
         if verbose:
             rprint(f"Running verification: {sys.executable} {verification_program}")
-        process = subprocess.run(
-            [sys.executable, verification_program],
-            capture_output=True,
-            text=True,
-            encoding='utf-8', # Ensure consistent encoding
-        )
+        try:
+            returncode, stdout, stderr = run_process_with_output(
+                [sys.executable, verification_program],
+                timeout=300
+            )
+            process = ProcessResult(returncode, stdout, stderr)
+            verification_status = f"Success (Return Code: {process.returncode})" if process.returncode == 0 else f"Failure (Return Code: {process.returncode})"
+            verification_output = process.stdout or "[No standard output]"
+            verification_error = process.stderr or "[No standard error]"
+        except Exception as e:
+            verification_status = f"Failure (Exception: {e})"
+            verification_output = "[Exception occurred]"
+            verification_error = str(e)
+            process = ProcessResult(-1, "", str(e))
-        verification_status = f"Success (Return Code: {process.returncode})" if process.returncode == 0 else f"Failure (Return Code: {process.returncode})"
-        verification_output = process.stdout or "[No standard output]"
-        verification_error = process.stderr or "[No standard error]"
         # Add verification results to the attempt log entry
-        attempt_log_entry += f"""\
+        attempt_log_entry += f"""
     <verification>
       <status>{verification_status}</status>
       <output><![CDATA[
@@ -155,7 +522,7 @@ def fix_code_loop(
         current_error_message = verification_error # Use stderr as the primary error source
         # Add current error to the attempt log entry
-        attempt_log_entry += f"""\
+        attempt_log_entry += f"""
     <current_error><![CDATA[
 {current_error_message}
 ]]></current_error>
@@ -164,30 +531,29 @@ def fix_code_loop(
         # Check budget *before* making the potentially expensive LLM call for the next attempt
         # (Only check if cost > 0 to avoid breaking before first attempt if budget is 0)
         if total_cost > budget and attempts > 0: # Check after first attempt cost is added
-             rprint(f"[bold yellow]Budget exceeded (${total_cost:.4f} > ${budget:.4f}) before attempt {current_attempt}. Stopping.[/bold yellow]")
+             rprint(f"[bold yellow]Budget exceeded (${total_cost:.4f} > ${budget:.4f}) before attempt {current_iteration_number}. Stopping.[/bold yellow]")
              history_log += attempt_log_entry + "    <error>Budget exceeded before LLM call</error>\n  </attempt>\n"
              break
         # Check max attempts *before* the LLM call for this attempt
         if attempts >= max_attempts:
-             rprint(f"[bold red]Maximum attempts ({max_attempts}) reached before attempt {current_attempt}. Stopping.[/bold red]")
+             rprint(f"[bold red]Maximum attempts ({max_attempts}) reached before attempt {current_iteration_number}. Stopping.[/bold red]")
              # No need to add to history here, loop condition handles it
              break
         # Create backup copies for this iteration BEFORE calling LLM
-        code_base, code_ext = os.path.splitext(code_file)
-        program_base, program_ext = os.path.splitext(verification_program)
-        code_backup_path = f"{code_base}_{current_attempt}{code_ext}"
-        program_backup_path = f"{program_base}_{current_attempt}{program_ext}"
+        # Store in .pdd/backups/ (backup_dir already created above)
+        code_backup_path = str(backup_dir / f"code_{current_iteration_number}{code_file_path.suffix}")
+        program_backup_path = str(backup_dir / f"program_{current_iteration_number}{verification_program_path.suffix}")
         try:
             shutil.copy2(code_file, code_backup_path)
             shutil.copy2(verification_program, program_backup_path)
             if verbose:
-                rprint(f"Created backups for attempt {current_attempt}: {code_backup_path}, {program_backup_path}")
+                rprint(f"Created backups for attempt {current_iteration_number}: {code_backup_path}, {program_backup_path}")
         except Exception as e:
-            rprint(f"[bold red]Error creating backups for attempt {current_attempt}: {e}[/bold red]")
+            rprint(f"[bold red]Error creating backups for attempt {current_iteration_number}: {e}[/bold red]")
             history_log += attempt_log_entry + f"    <error>Failed to create backups: {e}</error>\n  </attempt>\n"
             break # Cannot proceed reliably without backups
@@ -204,7 +570,7 @@ def fix_code_loop(
         # Temporarily close the XML structure for the LLM call
         error_context_for_llm = history_log + attempt_log_entry + "  </attempt>\n</history>\n"
-        # Call fix_code_module_errors
+        # Call fix (cloud or local based on use_cloud parameter)
         rprint("Attempting to fix errors using LLM...")
         update_program, update_code, fixed_program, fixed_code = False, False, "", ""
         program_code_fix, cost, model_name_iter = "", 0.0, None
@@ -214,36 +580,79 @@ def fix_code_loop(
         # For simplicity, we assume fix_code_module_errors prints directly using `rprint`
         try:
-            # Note: The example signature for fix_code_module_errors returns 7 values
-            (update_program, update_code, fixed_program, fixed_code,
-             program_code_fix, cost, model_name_iter) = fix_code_module_errors(
-                program=current_program,
-                prompt=prompt,
-                code=current_code,
-                errors=error_context_for_llm, # Pass the structured history
-                strength=strength,
-                temperature=temperature,
-                time=time, # Pass time
-                verbose=verbose,
-            )
-            if model_name_iter:
-                 model_name = model_name_iter # Update model name if returned
+            if use_cloud:
+                # Use cloud LLM for fix - local verification results passed via error_context_for_llm
+                try:
+                    (update_program, update_code, fixed_program, fixed_code,
+                     program_code_fix, cost, model_name_iter) = cloud_crash_fix(
+                        program=current_program,
+                        prompt=prompt,
+                        code=current_code,
+                        errors=error_context_for_llm,
+                        strength=strength,
+                        temperature=temperature,
+                        time=time,
+                        verbose=verbose,
+                        program_path=verification_program,
+                        code_path=code_file,
+                        language="python" if is_python else get_language(os.path.splitext(code_file)[1]),
+                    )
+                    if model_name_iter:
+                        model_name = model_name_iter
+                    if verbose:
+                        rprint(f"[cyan]Cloud crash fix completed. Cost: ${cost:.4f}[/cyan]")
+                except (requests.exceptions.RequestException, RuntimeError) as cloud_err:
+                    # Cloud failed - fall back to local
+                    rprint(f"[yellow]Cloud crash fix failed: {cloud_err}. Falling back to local.[/yellow]")
+                    (update_program, update_code, fixed_program, fixed_code,
+                     program_code_fix, cost, model_name_iter) = fix_code_module_errors(
+                        program=current_program,
+                        prompt=prompt,
+                        code=current_code,
+                        errors=error_context_for_llm,
+                        strength=strength,
+                        temperature=temperature,
+                        time=time,
+                        verbose=verbose,
+                        program_path=verification_program,
+                        code_path=code_file,
+                    )
+                    if model_name_iter:
+                        model_name = model_name_iter
+            else:
+                # Local LLM fix
+                # Note: The example signature for fix_code_module_errors returns 7 values
+                (update_program, update_code, fixed_program, fixed_code,
+                 program_code_fix, cost, model_name_iter) = fix_code_module_errors(
+                    program=current_program,
+                    prompt=prompt,
+                    code=current_code,
+                    errors=error_context_for_llm, # Pass the structured history
+                    strength=strength,
+                    temperature=temperature,
+                    time=time, # Pass time
+                    verbose=verbose,
+                    program_path=verification_program,  # Pass file path for LLM context
+                    code_path=code_file,                # Pass file path for LLM context
+                )
+                if model_name_iter:
+                     model_name = model_name_iter # Update model name if returned
         except Exception as e:
             rprint(f"[bold red]Error calling fix_code_module_errors: {e}[/bold red]")
             cost = 0.0 # Assume no cost if the call failed
             # Add error to the attempt log entry
-            attempt_log_entry += f"""\
+            attempt_log_entry += f"""
     <fixing>
       <error>LLM call failed: {e}</error>
     </fixing>
 """
-            # Continue to the next attempt or break if limits reached? Let's break.
             history_log += attempt_log_entry + "  </attempt>\n" # Log the attempt with the LLM error
+            attempts += 1 # Increment attempts even if LLM call failed
             break # Stop if the fixing mechanism itself fails
         # Add fixing results to the attempt log entry
-        attempt_log_entry += f"""\
+        attempt_log_entry += f"""
     <fixing>
       <llm_analysis><![CDATA[
 {program_code_fix or "[No analysis provided]"}
@@ -269,11 +678,13 @@ def fix_code_loop(
             rprint(f"[bold red]Error writing to log file {error_log_file}: {e}[/bold red]")
-        # Add cost and check budget *after* the LLM call
+        # Add cost and increment attempt counter (as per fix report) *before* checking budget
         total_cost += cost
+        attempts += 1 # Moved this line here as per fix report
         rprint(f"Attempt Cost: ${cost:.4f}, Total Cost: ${total_cost:.4f}, Budget: ${budget:.4f}")
         if total_cost > budget:
-            rprint(f"[bold yellow]Budget exceeded (${total_cost:.4f} > ${budget:.4f}) after attempt {current_attempt}. Stopping.[/bold yellow]")
+            rprint(f"[bold yellow]Budget exceeded (${total_cost:.4f} > ${budget:.4f}) after attempt {attempts}. Stopping.[/bold yellow]")
             break # Stop loop
         # If LLM suggested no changes but verification failed, stop to prevent loops
@@ -295,8 +706,7 @@ def fix_code_loop(
             success = False # Mark as failed if we can't write updates
             break # Stop if we cannot apply fixes
-        # e. Increment attempt counter (used for loop condition)
-        attempts += 1
+        # The original 'attempts += 1' was here. It has been moved earlier.
         # Check if max attempts reached after incrementing (for the next loop iteration check)
         if attempts >= max_attempts:
@@ -358,39 +768,57 @@ def fix_code_loop(
         rprint(f"[bold red]Final write to log file {error_log_file} failed: {e}[/bold red]")
     # Determine final number of attempts for reporting
-    # If loop finished by verification success (success=True), attempts = attempts made
-    # If loop finished by failure (budget, max_attempts, no_change_needed, error),
-    # the number of attempts *initiated* is 'attempts + 1' unless max_attempts was exactly hit.
-    # The tests seem to expect the number of attempts *initiated*.
-    # Let's refine the calculation slightly for clarity.
-    # 'attempts' holds the count of *completed* loops (0-indexed).
-    # 'current_attempt' holds the user-facing number (1-indexed) of the loop *currently running or just finished*.
+    # The 'attempts' variable correctly counts the number of LLM fix cycles that were initiated.
     final_attempts_reported = attempts
-    if not success:
-        # If failure occurred, it happened *during* or *after* the 'current_attempt' was initiated.
-        # If loop broke due to budget/no_change/error, current_attempt reflects the attempt number where failure occurred.
-        # If loop broke because attempts >= max_attempts, the last valid value for current_attempt was max_attempts.
-        # The number of attempts *tried* is current_attempt.
-        # However, the tests seem aligned with the previous logic. Let's stick to it unless further tests fail.
-        final_attempts_reported = attempts if success else (attempts + 1 if attempts < max_attempts and process.returncode != 0 else attempts)
-        # Re-evaluating the test logic:
-        # - Budget test: attempts=1 when loop breaks, expects 2. (attempts+1) -> 2. Correct.
-        # - Max attempts test: attempts=0 when loop breaks (no change), max_attempts=2, expects <=2. (attempts+1) -> 1. Correct.
-        # - If max_attempts=2 was reached *normally* (failed attempt 1, failed attempt 2), attempts would be 2.
-        #   The logic `attempts + 1 if attempts < max_attempts else attempts` would return 2. Correct.
-        # Let's simplify the return calculation based on 'attempts' which counts completed loops.
-        final_attempts_reported = attempts # Number of fully completed fix cycles
-        if not success and process and process.returncode != 0: # If we failed after at least one verification run
-             # Count the final failed attempt unless success was achieved on the very last possible attempt
-             if attempts < max_attempts:
-                 final_attempts_reported += 1
+    if not success and agentic_fallback:
+        # Ensure error_log_file exists before calling agentic fix
+        try:
+            if not os.path.exists(error_log_file) or os.path.getsize(error_log_file) == 0:
+                # Write minimal error log for agentic fix
+                error_log_path = Path(error_log_file)
+                error_log_path.parent.mkdir(parents=True, exist_ok=True)
+                with open(error_log_path, "w") as elog:
+                    if process:
+                        elog.write(f"Verification failed with return code: {process.returncode}\n")
+                        if process.stdout:
+                            elog.write(f"\nStdout:\n{process.stdout}\n")
+                        if process.stderr:
+                            elog.write(f"\nStderr:\n{process.stderr}\n")
+                    else:
+                        elog.write("No error information available\n")
+        except Exception as e:
+            rprint(f"[yellow]Warning: Could not write error log before agentic fallback: {e}[/yellow]")
+        rprint(f"[cyan]Attempting agentic fallback (prompt_file={prompt_file!r})...[/cyan]")
+        agent_success, agent_msg, agent_cost, agent_model, agent_changed_files = _safe_run_agentic_crash(
+            prompt_file=prompt_file,
+            code_file=code_file,
+            program_file=verification_program,
+            crash_log_file=error_log_file,
+            cwd=Path(prompt_file).parent if prompt_file else None
+        )
+        total_cost += agent_cost
+        if not agent_success:
+            rprint(f"[bold red]Agentic fallback failed: {agent_msg}[/bold red]")
+        if agent_changed_files:
+            rprint(f"[cyan]Agent modified {len(agent_changed_files)} file(s):[/cyan]")
+            for f in agent_changed_files:
+                rprint(f"  • {f}")
+        if agent_success:
+            model_name = agent_model or model_name
+            try:
+                final_code_content = Path(code_file).read_text(encoding='utf-8')
+                final_program_content = Path(verification_program).read_text(encoding='utf-8')
+            except Exception as e:
+                rprint(f"[yellow]Warning: Could not read files after successful agentic fix: {e}[/yellow]")
+            success = True
     return (
         success,
         final_program_content,
         final_code_content,
-        final_attempts_reported, # Use the refined calculation
+        final_attempts_reported,
         total_cost,
         model_name,
     )
@@ -519,4 +947,4 @@ sys.exit(0) # Exit with zero code for success
     #     for f in Path(".").glob("dummy_verify_*.py"): # Remove attempt backups like dummy_verify_1.py
     #          if "_original_backup" not in f.name: os.remove(f)
     # except OSError as e:
-    #     print(f"Error cleaning up dummy files: {e}")
+    #     print(f"Error cleaning up dummy files: {e}")

pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl

pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl