PyPI - pdd-cli - Versions diffs - 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl - Mend

pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (195) hide show

pdd/__init__.py +40 -8
pdd/agentic_bug.py +323 -0
pdd/agentic_bug_orchestrator.py +497 -0
pdd/agentic_change.py +231 -0
pdd/agentic_change_orchestrator.py +526 -0
pdd/agentic_common.py +598 -0
pdd/agentic_crash.py +534 -0
pdd/agentic_e2e_fix.py +319 -0
pdd/agentic_e2e_fix_orchestrator.py +426 -0
pdd/agentic_fix.py +1294 -0
pdd/agentic_langtest.py +162 -0
pdd/agentic_update.py +387 -0
pdd/agentic_verify.py +183 -0
pdd/architecture_sync.py +565 -0
pdd/auth_service.py +210 -0
pdd/auto_deps_main.py +71 -51
pdd/auto_include.py +245 -5
pdd/auto_update.py +125 -47
pdd/bug_main.py +196 -23
pdd/bug_to_unit_test.py +2 -0
pdd/change_main.py +11 -4
pdd/cli.py +22 -1181
pdd/cmd_test_main.py +350 -150
pdd/code_generator.py +60 -18
pdd/code_generator_main.py +790 -57
pdd/commands/__init__.py +48 -0
pdd/commands/analysis.py +306 -0
pdd/commands/auth.py +309 -0
pdd/commands/connect.py +290 -0
pdd/commands/fix.py +163 -0
pdd/commands/generate.py +257 -0
pdd/commands/maintenance.py +175 -0
pdd/commands/misc.py +87 -0
pdd/commands/modify.py +256 -0
pdd/commands/report.py +144 -0
pdd/commands/sessions.py +284 -0
pdd/commands/templates.py +215 -0
pdd/commands/utility.py +110 -0
pdd/config_resolution.py +58 -0
pdd/conflicts_main.py +8 -3
pdd/construct_paths.py +589 -111
pdd/context_generator.py +10 -2
pdd/context_generator_main.py +175 -76
pdd/continue_generation.py +53 -10
pdd/core/__init__.py +33 -0
pdd/core/cli.py +527 -0
pdd/core/cloud.py +237 -0
pdd/core/dump.py +554 -0
pdd/core/errors.py +67 -0
pdd/core/remote_session.py +61 -0
pdd/core/utils.py +90 -0
pdd/crash_main.py +262 -33
pdd/data/language_format.csv +71 -63
pdd/data/llm_model.csv +20 -18
pdd/detect_change_main.py +5 -4
pdd/docs/prompting_guide.md +864 -0
pdd/docs/whitepaper_with_benchmarks/data_and_functions/benchmark_analysis.py +495 -0
pdd/docs/whitepaper_with_benchmarks/data_and_functions/creation_compare.py +528 -0
pdd/fix_code_loop.py +523 -95
pdd/fix_code_module_errors.py +6 -2
pdd/fix_error_loop.py +491 -92
pdd/fix_errors_from_unit_tests.py +4 -3
pdd/fix_main.py +278 -21
pdd/fix_verification_errors.py +12 -100
pdd/fix_verification_errors_loop.py +529 -286
pdd/fix_verification_main.py +294 -89
pdd/frontend/dist/assets/index-B5DZHykP.css +1 -0
pdd/frontend/dist/assets/index-DQ3wkeQ2.js +449 -0
pdd/frontend/dist/index.html +376 -0
pdd/frontend/dist/logo.svg +33 -0
pdd/generate_output_paths.py +139 -15
pdd/generate_test.py +218 -146
pdd/get_comment.py +19 -44
pdd/get_extension.py +8 -9
pdd/get_jwt_token.py +318 -22
pdd/get_language.py +8 -7
pdd/get_run_command.py +75 -0
pdd/get_test_command.py +68 -0
pdd/git_update.py +70 -19
pdd/incremental_code_generator.py +2 -2
pdd/insert_includes.py +13 -4
pdd/llm_invoke.py +1711 -181
pdd/load_prompt_template.py +19 -12
pdd/path_resolution.py +140 -0
pdd/pdd_completion.fish +25 -2
pdd/pdd_completion.sh +30 -4
pdd/pdd_completion.zsh +79 -4
pdd/postprocess.py +14 -4
pdd/preprocess.py +293 -24
pdd/preprocess_main.py +41 -6
pdd/prompts/agentic_bug_step10_pr_LLM.prompt +182 -0
pdd/prompts/agentic_bug_step1_duplicate_LLM.prompt +73 -0
pdd/prompts/agentic_bug_step2_docs_LLM.prompt +129 -0
pdd/prompts/agentic_bug_step3_triage_LLM.prompt +95 -0
pdd/prompts/agentic_bug_step4_reproduce_LLM.prompt +97 -0
pdd/prompts/agentic_bug_step5_root_cause_LLM.prompt +123 -0
pdd/prompts/agentic_bug_step6_test_plan_LLM.prompt +107 -0
pdd/prompts/agentic_bug_step7_generate_LLM.prompt +172 -0
pdd/prompts/agentic_bug_step8_verify_LLM.prompt +119 -0
pdd/prompts/agentic_bug_step9_e2e_test_LLM.prompt +289 -0
pdd/prompts/agentic_change_step10_identify_issues_LLM.prompt +1006 -0
pdd/prompts/agentic_change_step11_fix_issues_LLM.prompt +984 -0
pdd/prompts/agentic_change_step12_create_pr_LLM.prompt +131 -0
pdd/prompts/agentic_change_step1_duplicate_LLM.prompt +73 -0
pdd/prompts/agentic_change_step2_docs_LLM.prompt +101 -0
pdd/prompts/agentic_change_step3_research_LLM.prompt +126 -0
pdd/prompts/agentic_change_step4_clarify_LLM.prompt +164 -0
pdd/prompts/agentic_change_step5_docs_change_LLM.prompt +981 -0
pdd/prompts/agentic_change_step6_devunits_LLM.prompt +1005 -0
pdd/prompts/agentic_change_step7_architecture_LLM.prompt +1044 -0
pdd/prompts/agentic_change_step8_analyze_LLM.prompt +1027 -0
pdd/prompts/agentic_change_step9_implement_LLM.prompt +1077 -0
pdd/prompts/agentic_crash_explore_LLM.prompt +49 -0
pdd/prompts/agentic_e2e_fix_step1_unit_tests_LLM.prompt +90 -0
pdd/prompts/agentic_e2e_fix_step2_e2e_tests_LLM.prompt +91 -0
pdd/prompts/agentic_e2e_fix_step3_root_cause_LLM.prompt +89 -0
pdd/prompts/agentic_e2e_fix_step4_fix_e2e_tests_LLM.prompt +96 -0
pdd/prompts/agentic_e2e_fix_step5_identify_devunits_LLM.prompt +91 -0
pdd/prompts/agentic_e2e_fix_step6_create_unit_tests_LLM.prompt +106 -0
pdd/prompts/agentic_e2e_fix_step7_verify_tests_LLM.prompt +116 -0
pdd/prompts/agentic_e2e_fix_step8_run_pdd_fix_LLM.prompt +120 -0
pdd/prompts/agentic_e2e_fix_step9_verify_all_LLM.prompt +146 -0
pdd/prompts/agentic_fix_explore_LLM.prompt +45 -0
pdd/prompts/agentic_fix_harvest_only_LLM.prompt +48 -0
pdd/prompts/agentic_fix_primary_LLM.prompt +85 -0
pdd/prompts/agentic_update_LLM.prompt +925 -0
pdd/prompts/agentic_verify_explore_LLM.prompt +45 -0
pdd/prompts/auto_include_LLM.prompt +122 -905
pdd/prompts/change_LLM.prompt +3093 -1
pdd/prompts/detect_change_LLM.prompt +686 -27
pdd/prompts/example_generator_LLM.prompt +22 -1
pdd/prompts/extract_code_LLM.prompt +5 -1
pdd/prompts/extract_program_code_fix_LLM.prompt +7 -1
pdd/prompts/extract_prompt_update_LLM.prompt +7 -8
pdd/prompts/extract_promptline_LLM.prompt +17 -11
pdd/prompts/find_verification_errors_LLM.prompt +6 -0
pdd/prompts/fix_code_module_errors_LLM.prompt +12 -2
pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +9 -0
pdd/prompts/fix_verification_errors_LLM.prompt +22 -0
pdd/prompts/generate_test_LLM.prompt +41 -7
pdd/prompts/generate_test_from_example_LLM.prompt +115 -0
pdd/prompts/increase_tests_LLM.prompt +1 -5
pdd/prompts/insert_includes_LLM.prompt +316 -186
pdd/prompts/prompt_code_diff_LLM.prompt +119 -0
pdd/prompts/prompt_diff_LLM.prompt +82 -0
pdd/prompts/trace_LLM.prompt +25 -22
pdd/prompts/unfinished_prompt_LLM.prompt +85 -1
pdd/prompts/update_prompt_LLM.prompt +22 -1
pdd/pytest_output.py +127 -12
pdd/remote_session.py +876 -0
pdd/render_mermaid.py +236 -0
pdd/server/__init__.py +52 -0
pdd/server/app.py +335 -0
pdd/server/click_executor.py +587 -0
pdd/server/executor.py +338 -0
pdd/server/jobs.py +661 -0
pdd/server/models.py +241 -0
pdd/server/routes/__init__.py +31 -0
pdd/server/routes/architecture.py +451 -0
pdd/server/routes/auth.py +364 -0
pdd/server/routes/commands.py +929 -0
pdd/server/routes/config.py +42 -0
pdd/server/routes/files.py +603 -0
pdd/server/routes/prompts.py +1322 -0
pdd/server/routes/websocket.py +473 -0
pdd/server/security.py +243 -0
pdd/server/terminal_spawner.py +209 -0
pdd/server/token_counter.py +222 -0
pdd/setup_tool.py +648 -0
pdd/simple_math.py +2 -0
pdd/split_main.py +3 -2
pdd/summarize_directory.py +237 -195
pdd/sync_animation.py +8 -4
pdd/sync_determine_operation.py +839 -112
pdd/sync_main.py +351 -57
pdd/sync_orchestration.py +1400 -756
pdd/sync_tui.py +848 -0
pdd/template_expander.py +161 -0
pdd/template_registry.py +264 -0
pdd/templates/architecture/architecture_json.prompt +237 -0
pdd/templates/generic/generate_prompt.prompt +174 -0
pdd/trace.py +168 -12
pdd/trace_main.py +4 -3
pdd/track_cost.py +140 -63
pdd/unfinished_prompt.py +51 -4
pdd/update_main.py +567 -67
pdd/update_model_costs.py +2 -2
pdd/update_prompt.py +19 -4
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/METADATA +29 -11
pdd_cli-0.0.118.dist-info/RECORD +227 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/licenses/LICENSE +1 -1
pdd_cli-0.0.45.dist-info/RECORD +0 -116
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/WHEEL +0 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/entry_points.txt +0 -0
{pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/top_level.txt +0 -0

pdd/preprocess.py CHANGED Viewed

@@ -1,37 +1,158 @@
 import os
 import re
+import base64
 import subprocess
-from typing import List, Optional
+from typing import List, Optional, Tuple
 import traceback
+from pathlib import Path
 from rich.console import Console
 from rich.panel import Panel
 from rich.markup import escape
 from rich.traceback import install
+from pdd.path_resolution import get_default_resolver
 install()
 console = Console()
+# Debug/Instrumentation controls
+_DEBUG_PREPROCESS = str(os.getenv("PDD_PREPROCESS_DEBUG", "")).lower() in ("1", "true", "yes", "on")
+_DEBUG_OUTPUT_FILE = os.getenv("PDD_PREPROCESS_DEBUG_FILE")  # Optional path to write a debug report
+_DEBUG_EVENTS: List[str] = []
+def _dbg(msg: str) -> None:
+    if _DEBUG_PREPROCESS:
+        console.print(f"[dim][PPD][preprocess][/dim] {escape(msg)}")
+        _DEBUG_EVENTS.append(msg)
+def _write_debug_report() -> None:
+    if _DEBUG_PREPROCESS and _DEBUG_OUTPUT_FILE:
+        try:
+            with open(_DEBUG_OUTPUT_FILE, "w", encoding="utf-8") as fh:
+                fh.write("Preprocess Debug Report\n\n")
+                for line in _DEBUG_EVENTS:
+                    fh.write(line + "\n")
+            console.print(f"[green]Debug report written to:[/green] {_DEBUG_OUTPUT_FILE}")
+        except Exception as e:
+            # Report the error so users know why the log file wasn't written
+            console.print(f"[yellow]Warning: Could not write debug report to {_DEBUG_OUTPUT_FILE}: {e}[/yellow]")
+    elif _DEBUG_PREPROCESS and not _DEBUG_OUTPUT_FILE:
+        console.print("[dim]Debug mode enabled but PDD_PREPROCESS_DEBUG_FILE not set (output shown in console only)[/dim]")
+def _extract_fence_spans(text: str) -> List[Tuple[int, int]]:
+    """Return list of (start, end) spans for fenced code blocks (``` or ~~~).
+    The spans are [start, end) indices in the original text.
+    """
+    spans: List[Tuple[int, int]] = []
+    try:
+        fence_re = re.compile(
+            r"(?m)^[ \t]*([`~]{3,})[^\n]*\n[\s\S]*?\n[ \t]*\1[ \t]*(?:\n|$)"
+        )
+        for m in fence_re.finditer(text):
+            spans.append((m.start(), m.end()))
+    except Exception:
+        pass
+    return spans
+def _extract_inline_code_spans(text: str) -> List[Tuple[int, int]]:
+    """Return list of (start, end) spans for inline code (backticks)."""
+    spans: List[Tuple[int, int]] = []
+    try:
+        for m in re.finditer(r"(?<!`)(`+)([^\n]*?)\1", text):
+            spans.append((m.start(), m.end()))
+    except Exception:
+        pass
+    return spans
+def _extract_code_spans(text: str) -> List[Tuple[int, int]]:
+    spans = _extract_fence_spans(text)
+    spans.extend(_extract_inline_code_spans(text))
+    return sorted(spans, key=lambda s: s[0])
+def _is_inside_any_span(idx: int, spans: List[Tuple[int, int]]) -> bool:
+    for s, e in spans:
+        if s <= idx < e:
+            return True
+    return False
+def _intersects_any_span(start: int, end: int, spans: List[Tuple[int, int]]) -> bool:
+    for s, e in spans:
+        if start < e and end > s:
+            return True
+    return False
+def _scan_risky_placeholders(text: str) -> Tuple[List[Tuple[int, str]], List[Tuple[int, str]]]:
+    """Scan for risky placeholders outside code fences.
+    Returns two lists of (line_no, snippet):
+      - single_brace: matches like {name} not doubled and not part of {{...}}
+      - template_brace: `${...}` occurrences (which include single { ... })
+    """
+    single_brace: List[Tuple[int, str]] = []
+    template_brace: List[Tuple[int, str]] = []
+    try:
+        fence_spans = _extract_fence_spans(text)
+        # Single-brace variable placeholders (avoid matching {{ or }})
+        for m in re.finditer(r"(?<!\{)\{([A-Za-z_][A-Za-z0-9_]*)\}(?!\})", text):
+            if not _is_inside_any_span(m.start(), fence_spans):
+                line_no = text.count("\n", 0, m.start()) + 1
+                single_brace.append((line_no, m.group(0)))
+        # JavaScript template placeholders like ${...}
+        for m in re.finditer(r"\$\{[^\}]+\}", text):
+            if not _is_inside_any_span(m.start(), fence_spans):
+                line_no = text.count("\n", 0, m.start()) + 1
+                template_brace.append((line_no, m.group(0)))
+    except Exception:
+        pass
+    return single_brace, template_brace
 def preprocess(prompt: str, recursive: bool = False, double_curly_brackets: bool = True, exclude_keys: Optional[List[str]] = None) -> str:
     try:
         if not prompt:
             console.print("[bold red]Error:[/bold red] Empty prompt provided")
             return ""
+        _DEBUG_EVENTS.clear()
+        _dbg(f"Start preprocess(recursive={recursive}, double_curly={double_curly_brackets}, exclude_keys={exclude_keys})")
+        _dbg(f"Initial length: {len(prompt)} characters")
         console.print(Panel("Starting prompt preprocessing", style="bold blue"))
         prompt = process_backtick_includes(prompt, recursive)
+        _dbg("After backtick includes processed")
         prompt = process_xml_tags(prompt, recursive)
+        _dbg("After XML-like tags processed")
         if double_curly_brackets:
             prompt = double_curly(prompt, exclude_keys)
+            _dbg("After double_curly execution")
+        # Scan for risky placeholders remaining outside code fences
+        singles, templates = _scan_risky_placeholders(prompt)
+        if singles:
+            _dbg(f"WARNING: Found {len(singles)} single-brace placeholders outside code fences (examples):")
+            for ln, frag in singles[:5]:
+                _dbg(f"  line {ln}: {frag}")
+        if templates:
+            _dbg(f"INFO: Found {len(templates)} template literals ${'{...'} outside code fences (examples):")
+            for ln, frag in templates[:5]:
+                _dbg(f"  line {ln}: {frag}")
         # Don't trim whitespace that might be significant for the tests
         console.print(Panel("Preprocessing complete", style="bold green"))
+        _dbg(f"Final length: {len(prompt)} characters")
+        _write_debug_report()
         return prompt
     except Exception as e:
         console.print(f"[bold red]Error during preprocessing:[/bold red] {str(e)}")
         console.print(Panel(traceback.format_exc(), title="Error Details", style="red"))
+        _dbg(f"Exception: {str(e)}")
+        _write_debug_report()
         return prompt
 def get_file_path(file_name: str) -> str:
-    base_path = './'
-    return os.path.join(base_path, file_name)
+    resolver = get_default_resolver()
+    resolved = resolver.resolve_include(file_name)
+    if not Path(file_name).is_absolute() and resolved == resolver.cwd / file_name:
+        return os.path.join("./", file_name)
+    return str(resolved)
 def process_backtick_includes(text: str, recursive: bool) -> str:
     # More specific pattern that doesn't match nested > characters
@@ -45,12 +166,17 @@ def process_backtick_includes(text: str, recursive: bool) -> str:
                 content = file.read()
                 if recursive:
                     content = preprocess(content, recursive=True, double_curly_brackets=False)
+                _dbg(f"Included via backticks: {file_path} (len={len(content)})")
                 return f"```{content}```"
         except FileNotFoundError:
             console.print(f"[bold red]Warning:[/bold red] File not found: {file_path}")
-            return match.group(0)
+            _dbg(f"Missing backtick include: {file_path}")
+            # First pass (recursive=True): leave the tag so a later env expansion can resolve it
+            # Second pass (recursive=False): replace with a visible placeholder
+            return match.group(0) if recursive else f"```[File not found: {file_path}]```"
         except Exception as e:
             console.print(f"[bold red]Error processing include:[/bold red] {str(e)}")
+            _dbg(f"Error processing backtick include {file_path}: {e}")
             return f"```[Error processing include: {file_path}]```"
     prev_text = ""
     current_text = text
@@ -62,9 +188,9 @@ def process_backtick_includes(text: str, recursive: bool) -> str:
 def process_xml_tags(text: str, recursive: bool) -> str:
     text = process_pdd_tags(text)
     text = process_include_tags(text, recursive)
-    text = process_shell_tags(text)
-    text = process_web_tags(text)
+    text = process_include_many_tags(text, recursive)
+    text = process_shell_tags(text, recursive)
+    text = process_web_tags(text, recursive)
     return text
 def process_include_tags(text: str, recursive: bool) -> str:
@@ -73,23 +199,74 @@ def process_include_tags(text: str, recursive: bool) -> str:
         file_path = match.group(1).strip()
         try:
             full_path = get_file_path(file_path)
-            console.print(f"Processing XML include: [cyan]{full_path}[/cyan]")
-            with open(full_path, 'r', encoding='utf-8') as file:
-                content = file.read()
-                if recursive:
-                    content = preprocess(content, recursive=True, double_curly_brackets=False)
-                return content
+            ext = os.path.splitext(file_path)[1].lower()
+            image_extensions = ['.png', '.jpg', '.jpeg', '.gif', '.webp', '.heic']
+            if ext in image_extensions:
+                console.print(f"Processing image include: [cyan]{full_path}[/cyan]")
+                from PIL import Image
+                import io
+                import pillow_heif
+                pillow_heif.register_heif_opener()
+                MAX_DIMENSION = 1024
+                with open(full_path, 'rb') as file:
+                    img = Image.open(file)
+                    img.load() # Force loading the image data before the file closes
+                    if img.width > MAX_DIMENSION or img.height > MAX_DIMENSION:
+                        img.thumbnail((MAX_DIMENSION, MAX_DIMENSION))
+                        console.print(f"Image resized to {img.size}")
+                # Handle GIFs: convert to a static PNG of the first frame
+                if ext == '.gif':
+                    img.seek(0)
+                    img = img.convert("RGB")
+                    img_format = 'PNG'
+                    mime_type = 'image/png'
+                elif ext == '.heic':
+                    img_format = 'JPEG'
+                    mime_type = 'image/jpeg'
+                else:
+                    img_format = 'JPEG' if ext in ['.jpg', '.jpeg'] else 'PNG'
+                    mime_type = f'image/{img_format.lower()}'
+                # Save the (potentially resized and converted) image to an in-memory buffer
+                buffer = io.BytesIO()
+                img.save(buffer, format=img_format)
+                content = buffer.getvalue()
+                encoded_string = base64.b64encode(content).decode('utf-8')
+                return f"data:{mime_type};base64,{encoded_string}"
+            else:
+                console.print(f"Processing XML include: [cyan]{full_path}[/cyan]")
+                with open(full_path, 'r', encoding='utf-8') as file:
+                    content = file.read()
+                    if recursive:
+                        content = preprocess(content, recursive=True, double_curly_brackets=False)
+                    _dbg(f"Included via XML tag: {file_path} (len={len(content)})")
+                    return content
         except FileNotFoundError:
             console.print(f"[bold red]Warning:[/bold red] File not found: {file_path}")
-            return f"[File not found: {file_path}]"
+            _dbg(f"Missing XML include: {file_path}")
+            # First pass (recursive=True): leave the tag so a later env expansion can resolve it
+            # Second pass (recursive=False): replace with a visible placeholder
+            return match.group(0) if recursive else f"[File not found: {file_path}]"
         except Exception as e:
             console.print(f"[bold red]Error processing include:[/bold red] {str(e)}")
+            _dbg(f"Error processing XML include {file_path}: {e}")
             return f"[Error processing include: {file_path}]"
     prev_text = ""
     current_text = text
     while prev_text != current_text:
         prev_text = current_text
-        current_text = re.sub(pattern, replace_include, current_text, flags=re.DOTALL)
+        code_spans = _extract_code_spans(current_text)
+        def replace_include_with_spans(match):
+            if _intersects_any_span(match.start(), match.end(), code_spans):
+                return match.group(0)
+            return replace_include(match)
+        current_text = re.sub(pattern, replace_include_with_spans, current_text, flags=re.DOTALL)
     return current_text
 def process_pdd_tags(text: str) -> str:
@@ -101,54 +278,120 @@ def process_pdd_tags(text: str) -> str:
         return "This is a test "
     return processed
-def process_shell_tags(text: str) -> str:
+def process_shell_tags(text: str, recursive: bool) -> str:
     pattern = r'<shell>(.*?)</shell>'
     def replace_shell(match):
         command = match.group(1).strip()
+        if recursive:
+            # Defer execution until after env var expansion
+            return match.group(0)
         console.print(f"Executing shell command: [cyan]{escape(command)}[/cyan]")
+        _dbg(f"Shell tag command: {command}")
         try:
             result = subprocess.run(command, shell=True, check=True, capture_output=True, text=True)
             return result.stdout
         except subprocess.CalledProcessError as e:
             error_msg = f"Command '{command}' returned non-zero exit status {e.returncode}."
             console.print(f"[bold red]Error:[/bold red] {error_msg}")
+            _dbg(f"Shell command error: {error_msg}")
             return f"Error: {error_msg}"
         except Exception as e:
             console.print(f"[bold red]Error executing shell command:[/bold red] {str(e)}")
+            _dbg(f"Shell execution exception: {e}")
             return f"[Shell execution error: {str(e)}]"
-    return re.sub(pattern, replace_shell, text, flags=re.DOTALL)
+    code_spans = _extract_code_spans(text)
+    def replace_shell_with_spans(match):
+        if _intersects_any_span(match.start(), match.end(), code_spans):
+            return match.group(0)
+        return replace_shell(match)
+    return re.sub(pattern, replace_shell_with_spans, text, flags=re.DOTALL)
-def process_web_tags(text: str) -> str:
+def process_web_tags(text: str, recursive: bool) -> str:
     pattern = r'<web>(.*?)</web>'
     def replace_web(match):
         url = match.group(1).strip()
+        if recursive:
+            # Defer network operations until after env var expansion
+            return match.group(0)
         console.print(f"Scraping web content from: [cyan]{url}[/cyan]")
+        _dbg(f"Web tag URL: {url}")
         try:
             try:
-                from firecrawl import FirecrawlApp
+                from firecrawl import Firecrawl
             except ImportError:
+                _dbg("firecrawl import failed; package not installed")
                 return f"[Error: firecrawl-py package not installed. Cannot scrape {url}]"
             api_key = os.environ.get('FIRECRAWL_API_KEY')
             if not api_key:
                 console.print("[bold yellow]Warning:[/bold yellow] FIRECRAWL_API_KEY not found in environment")
+                _dbg("FIRECRAWL_API_KEY not set")
                 return f"[Error: FIRECRAWL_API_KEY not set. Cannot scrape {url}]"
-            app = FirecrawlApp(api_key=api_key)
-            response = app.scrape_url(url, formats=['markdown'])
-            if hasattr(response, 'markdown'):
+            app = Firecrawl(api_key=api_key)
+            response = app.scrape(url, formats=['markdown'])
+            # Handle both dict response (new API) and object response (legacy)
+            if isinstance(response, dict) and 'markdown' in response:
+                _dbg(f"Web scrape returned markdown (len={len(response['markdown'])})")
+                return response['markdown']
+            elif hasattr(response, 'markdown'):
+                _dbg(f"Web scrape returned markdown (len={len(response.markdown)})")
                 return response.markdown
             else:
                 console.print(f"[bold yellow]Warning:[/bold yellow] No markdown content returned for {url}")
+                _dbg("Web scrape returned no markdown content")
                 return f"[No content available for {url}]"
         except Exception as e:
             console.print(f"[bold red]Error scraping web content:[/bold red] {str(e)}")
+            _dbg(f"Web scraping exception: {e}")
             return f"[Web scraping error: {str(e)}]"
-    return re.sub(pattern, replace_web, text, flags=re.DOTALL)
+    code_spans = _extract_code_spans(text)
+    def replace_web_with_spans(match):
+        if _intersects_any_span(match.start(), match.end(), code_spans):
+            return match.group(0)
+        return replace_web(match)
+    return re.sub(pattern, replace_web_with_spans, text, flags=re.DOTALL)
+def process_include_many_tags(text: str, recursive: bool) -> str:
+    """Process <include-many> blocks whose inner content is a comma- or newline-separated
+    list of file paths (typically provided via variables after env expansion)."""
+    pattern = r'<include-many>(.*?)</include-many>'
+    def replace_many(match):
+        inner = match.group(1)
+        if recursive:
+            # Wait for env expansion to materialize the list
+            return match.group(0)
+        # Split by newlines or commas
+        raw_items = [s.strip() for part in inner.split('\n') for s in part.split(',')]
+        paths = [p for p in raw_items if p]
+        contents: list[str] = []
+        for p in paths:
+            try:
+                full_path = get_file_path(p)
+                console.print(f"Including (many): [cyan]{full_path}[/cyan]")
+                with open(full_path, 'r', encoding='utf-8') as fh:
+                    contents.append(fh.read())
+                _dbg(f"Included (many): {p}")
+            except FileNotFoundError:
+                console.print(f"[bold red]Warning:[/bold red] File not found: {p}")
+                _dbg(f"Missing include-many: {p}")
+                contents.append(f"[File not found: {p}]")
+            except Exception as e:
+                console.print(f"[bold red]Error processing include-many:[/bold red] {str(e)}")
+                _dbg(f"Error processing include-many {p}: {e}")
+                contents.append(f"[Error processing include: {p}]")
+        return "\n".join(contents)
+    code_spans = _extract_code_spans(text)
+    def replace_many_with_spans(match):
+        if _intersects_any_span(match.start(), match.end(), code_spans):
+            return match.group(0)
+        return replace_many(match)
+    return re.sub(pattern, replace_many_with_spans, text, flags=re.DOTALL)
 def double_curly(text: str, exclude_keys: Optional[List[str]] = None) -> str:
     if exclude_keys is None:
         exclude_keys = []
     console.print("Doubling curly brackets...")
+    _dbg("double_curly invoked")
     # Special case handling for specific test patterns
     if "Mix of {excluded{inner}} nesting" in text and "excluded" in exclude_keys:
@@ -172,6 +415,14 @@ def double_curly(text: str, exclude_keys: Optional[List[str]] = None) -> str:
             "2": {{"id": "2", "name": "Resource Two"}}
         }}"""
+    # Protect ${IDENT} placeholders so we can safely double braces, then restore
+    # them as ${{IDENT}} to avoid PromptTemplate interpreting {IDENT}.
+    protected_vars: List[str] = []
+    def _protect_var(m):
+        protected_vars.append(m.group(0))
+        return f"__PDD_VAR_{len(protected_vars)-1}__"
+    text = re.sub(r"\$\{[A-Za-z_][A-Za-z0-9_]*\}", _protect_var, text)
     # First, protect any existing double curly braces
     text = re.sub(r'\{\{([^{}]*)\}\}', r'__ALREADY_DOUBLED__\1__END_ALREADY__', text)
@@ -188,6 +439,24 @@ def double_curly(text: str, exclude_keys: Optional[List[str]] = None) -> str:
     # Restore already doubled brackets
     text = re.sub(r'__ALREADY_DOUBLED__(.*?)__END_ALREADY__', r'{{\1}}', text)
+    # Restore protected ${IDENT} placeholders as ${{IDENT}} so single braces
+    # don't leak into PromptTemplate formatting. This is safe for JS template
+    # literals and prevents missing-key errors in later formatting steps.
+    def _restore_var(m):
+        idx = int(m.group(1))
+        if 0 <= idx < len(protected_vars):
+            original = protected_vars[idx]  # e.g., ${FOO}
+            try:
+                inner = re.match(r"\$\{([A-Za-z_][A-Za-z0-9_]*)\}", original)
+                if inner:
+                    # Build as concatenation to avoid f-string brace escaping confusion
+                    return "${{" + inner.group(1) + "}}"  # -> ${{FOO}}
+            except Exception:
+                pass
+            return original
+        return m.group(0)
+    text = re.sub(r"__PDD_VAR_(\d+)__", _restore_var, text)
     # Special handling for code blocks
     code_block_pattern = r'```([\w\s]*)\n([\s\S]*?)```'
@@ -213,4 +482,4 @@ def double_curly(text: str, exclude_keys: Optional[List[str]] = None) -> str:
     # Process code blocks
     text = re.sub(code_block_pattern, process_code_block, text, flags=re.DOTALL)
-    return text
+    return text

pdd/preprocess_main.py CHANGED Viewed

@@ -1,15 +1,23 @@
 import csv
 import sys
+from pathlib import Path
 from typing import Tuple, Optional
 import click
 from rich import print as rprint
+from .config_resolution import resolve_effective_config
 from .construct_paths import construct_paths
 from .preprocess import preprocess
 from .xml_tagger import xml_tagger
-from . import DEFAULT_TIME, DEFAULT_STRENGTH
+from .architecture_sync import (
+    get_architecture_entry_for_prompt,
+    generate_tags_from_architecture,
+    has_pdd_tags,
+)
 def preprocess_main(
-    ctx: click.Context, prompt_file: str, output: Optional[str], xml: bool, recursive: bool, double: bool, exclude: list
+    ctx: click.Context, prompt_file: str, output: Optional[str], xml: bool, recursive: bool, double: bool, exclude: list, pdd_tags: bool = False
 ) -> Tuple[str, float, str]:
     """
     CLI wrapper for preprocessing prompts.
@@ -22,6 +30,7 @@ def preprocess_main(
     :param double: If True, curly brackets will be doubled.
     :param exclude: List of keys to exclude from curly bracket doubling.
     :return: Tuple containing the preprocessed prompt, total cost, and model name used.
+    :param pdd_tags: If True, inject PDD metadata tags from architecture.json.
     """
     try:
         # Construct file paths
@@ -33,17 +42,41 @@ def preprocess_main(
             quiet=ctx.obj.get("quiet", False),
             command="preprocess",
             command_options=command_options,
+            context_override=ctx.obj.get('context')
         )
         # Load prompt file
         prompt = input_strings["prompt_file"]
+        # Inject PDD metadata tags from architecture.json if requested
+        pdd_tags_injected = False
+        if pdd_tags:
+            prompt_filename = Path(prompt_file).name
+            arch_entry = get_architecture_entry_for_prompt(prompt_filename)
+            if arch_entry:
+                if has_pdd_tags(prompt):
+                    if not ctx.obj.get("quiet", False):
+                        rprint(f"[yellow]Prompt already has PDD tags, skipping injection.[/yellow]")
+                else:
+                    generated_tags = generate_tags_from_architecture(arch_entry)
+                    if generated_tags:
+                        prompt = generated_tags + '\n\n' + prompt
+                        pdd_tags_injected = True
+                        if not ctx.obj.get("quiet", False):
+                            rprint(f"[green]Injected PDD tags from architecture.json[/green]")
+            else:
+                if not ctx.obj.get("quiet", False):
+                    rprint(f"[yellow]No architecture entry found for '{prompt_filename}', skipping PDD tags.[/yellow]")
         if xml:
             # Use xml_tagger to add XML delimiters
-            strength = ctx.obj.get("strength", DEFAULT_STRENGTH)
-            temperature = ctx.obj.get("temperature", 0.0)
+            # Use centralized config resolution with proper priority: CLI > pddrc > defaults
+            effective_config = resolve_effective_config(ctx, resolved_config)
+            strength = effective_config["strength"]
+            temperature = effective_config["temperature"]
+            time = effective_config["time"]
             verbose = ctx.obj.get("verbose", False)
-            time = ctx.obj.get("time", DEFAULT_TIME)
             xml_tagged, total_cost, model_name = xml_tagger(
                 prompt,
                 strength,
@@ -64,6 +97,8 @@ def preprocess_main(
         # Provide user feedback
         if not ctx.obj.get("quiet", False):
             rprint("[bold green]Prompt preprocessing completed successfully.[/bold green]")
+            if pdd_tags_injected:
+                rprint("[bold]PDD metadata tags: injected from architecture.json[/bold]")
             if xml:
                 rprint(f"[bold]XML Tagging used: {model_name}[/bold]")
             else:
@@ -76,4 +111,4 @@ def preprocess_main(
     except Exception as e:
         if not ctx.obj.get("quiet", False):
             rprint(f"[bold red]Error during preprocessing:[/bold red] {e}")
-        sys.exit(1)
+        sys.exit(1)

pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl

pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl