PyPI - pdd-cli - Versions diffs - 0.0.42__py3-none-any.whl → 0.0.90__py3-none-any.whl - Mend

pdd-cli 0.0.42 (py3-none-any.whl) → 0.0.90 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (119) hide show

pdd/__init__.py +4 -4
pdd/agentic_common.py +863 -0
pdd/agentic_crash.py +534 -0
pdd/agentic_fix.py +1179 -0
pdd/agentic_langtest.py +162 -0
pdd/agentic_update.py +370 -0
pdd/agentic_verify.py +183 -0
pdd/auto_deps_main.py +15 -5
pdd/auto_include.py +63 -5
pdd/bug_main.py +3 -2
pdd/bug_to_unit_test.py +2 -0
pdd/change_main.py +11 -4
pdd/cli.py +22 -1181
pdd/cmd_test_main.py +80 -19
pdd/code_generator.py +58 -18
pdd/code_generator_main.py +672 -25
pdd/commands/__init__.py +42 -0
pdd/commands/analysis.py +248 -0
pdd/commands/fix.py +140 -0
pdd/commands/generate.py +257 -0
pdd/commands/maintenance.py +174 -0
pdd/commands/misc.py +79 -0
pdd/commands/modify.py +230 -0
pdd/commands/report.py +144 -0
pdd/commands/templates.py +215 -0
pdd/commands/utility.py +110 -0
pdd/config_resolution.py +58 -0
pdd/conflicts_main.py +8 -3
pdd/construct_paths.py +281 -81
pdd/context_generator.py +10 -2
pdd/context_generator_main.py +113 -11
pdd/continue_generation.py +47 -7
pdd/core/__init__.py +0 -0
pdd/core/cli.py +503 -0
pdd/core/dump.py +554 -0
pdd/core/errors.py +63 -0
pdd/core/utils.py +90 -0
pdd/crash_main.py +44 -11
pdd/data/language_format.csv +71 -62
pdd/data/llm_model.csv +20 -18
pdd/detect_change_main.py +5 -4
pdd/fix_code_loop.py +331 -77
pdd/fix_error_loop.py +209 -60
pdd/fix_errors_from_unit_tests.py +4 -3
pdd/fix_main.py +75 -18
pdd/fix_verification_errors.py +12 -100
pdd/fix_verification_errors_loop.py +319 -272
pdd/fix_verification_main.py +57 -17
pdd/generate_output_paths.py +93 -10
pdd/generate_test.py +16 -5
pdd/get_jwt_token.py +48 -9
pdd/get_run_command.py +73 -0
pdd/get_test_command.py +68 -0
pdd/git_update.py +70 -19
pdd/increase_tests.py +7 -0
pdd/incremental_code_generator.py +2 -2
pdd/insert_includes.py +11 -3
pdd/llm_invoke.py +1278 -110
pdd/load_prompt_template.py +36 -10
pdd/pdd_completion.fish +25 -2
pdd/pdd_completion.sh +30 -4
pdd/pdd_completion.zsh +79 -4
pdd/postprocess.py +10 -3
pdd/preprocess.py +228 -15
pdd/preprocess_main.py +8 -5
pdd/prompts/agentic_crash_explore_LLM.prompt +49 -0
pdd/prompts/agentic_fix_explore_LLM.prompt +45 -0
pdd/prompts/agentic_fix_harvest_only_LLM.prompt +48 -0
pdd/prompts/agentic_fix_primary_LLM.prompt +85 -0
pdd/prompts/agentic_update_LLM.prompt +1071 -0
pdd/prompts/agentic_verify_explore_LLM.prompt +45 -0
pdd/prompts/auto_include_LLM.prompt +98 -101
pdd/prompts/change_LLM.prompt +1 -3
pdd/prompts/detect_change_LLM.prompt +562 -3
pdd/prompts/example_generator_LLM.prompt +22 -1
pdd/prompts/extract_code_LLM.prompt +5 -1
pdd/prompts/extract_program_code_fix_LLM.prompt +14 -2
pdd/prompts/extract_prompt_update_LLM.prompt +7 -8
pdd/prompts/extract_promptline_LLM.prompt +17 -11
pdd/prompts/find_verification_errors_LLM.prompt +6 -0
pdd/prompts/fix_code_module_errors_LLM.prompt +16 -4
pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +6 -41
pdd/prompts/fix_verification_errors_LLM.prompt +22 -0
pdd/prompts/generate_test_LLM.prompt +21 -6
pdd/prompts/increase_tests_LLM.prompt +1 -2
pdd/prompts/insert_includes_LLM.prompt +1181 -6
pdd/prompts/split_LLM.prompt +1 -62
pdd/prompts/trace_LLM.prompt +25 -22
pdd/prompts/unfinished_prompt_LLM.prompt +85 -1
pdd/prompts/update_prompt_LLM.prompt +22 -1
pdd/prompts/xml_convertor_LLM.prompt +3246 -7
pdd/pytest_output.py +188 -21
pdd/python_env_detector.py +151 -0
pdd/render_mermaid.py +236 -0
pdd/setup_tool.py +648 -0
pdd/simple_math.py +2 -0
pdd/split_main.py +3 -2
pdd/summarize_directory.py +56 -7
pdd/sync_determine_operation.py +918 -186
pdd/sync_main.py +82 -32
pdd/sync_orchestration.py +1456 -453
pdd/sync_tui.py +848 -0
pdd/template_registry.py +264 -0
pdd/templates/architecture/architecture_json.prompt +242 -0
pdd/templates/generic/generate_prompt.prompt +174 -0
pdd/trace.py +168 -12
pdd/trace_main.py +4 -3
pdd/track_cost.py +151 -61
pdd/unfinished_prompt.py +49 -3
pdd/update_main.py +549 -67
pdd/update_model_costs.py +2 -2
pdd/update_prompt.py +19 -4
{pdd_cli-0.0.42.dist-info → pdd_cli-0.0.90.dist-info}/METADATA +20 -7
pdd_cli-0.0.90.dist-info/RECORD +153 -0
{pdd_cli-0.0.42.dist-info → pdd_cli-0.0.90.dist-info}/licenses/LICENSE +1 -1
pdd_cli-0.0.42.dist-info/RECORD +0 -115
{pdd_cli-0.0.42.dist-info → pdd_cli-0.0.90.dist-info}/WHEEL +0 -0
{pdd_cli-0.0.42.dist-info → pdd_cli-0.0.90.dist-info}/entry_points.txt +0 -0
{pdd_cli-0.0.42.dist-info → pdd_cli-0.0.90.dist-info}/top_level.txt +0 -0

pdd/code_generator_main.py CHANGED Viewed

@@ -1,10 +1,13 @@
 import os
+import re
 import asyncio
 import json
 import pathlib
 import shlex
 import subprocess
 import requests
+import tempfile
+import sys
 from typing import Optional, Tuple, Dict, Any, List
 import click
@@ -19,6 +22,7 @@ from .preprocess import preprocess as pdd_preprocess
 from .code_generator import code_generator as local_code_generator_func
 from .incremental_code_generator import incremental_code_generator as incremental_code_generator_func
 from .get_jwt_token import get_jwt_token, AuthError, NetworkError, TokenError, UserCancelledError, RateLimitError
+from .python_env_detector import detect_host_python_executable
 # Environment variable names for Firebase/GitHub auth
 FIREBASE_API_KEY_ENV_VAR = "NEXT_PUBLIC_FIREBASE_API_KEY"
@@ -31,6 +35,17 @@ CLOUD_REQUEST_TIMEOUT = 400  # seconds
 console = Console()
+# --- Helper Functions ---
+def _parse_llm_bool(value: str) -> bool:
+    """Parse LLM boolean value from string."""
+    if not value:  # empty string / None / other falsy input counts as "enabled"
+        return True
+    llm_str = str(value).strip().lower()  # compare case-insensitively, ignoring surrounding whitespace
+    if llm_str in {"0", "false", "no", "off"}:
+        return False
+    else:
+        return llm_str in {"1", "true", "yes", "on"}  # anything unrecognized also yields False
 # --- Git Helper Functions ---
 def _run_git_command(command: List[str], cwd: Optional[str] = None) -> Tuple[int, str, str]:
     """Runs a git command and returns (return_code, stdout, stderr)."""
@@ -59,6 +74,102 @@ def is_git_repository(path: Optional[str] = None) -> bool:
     return False
+def _expand_vars(text: str, vars_map: Optional[Dict[str, str]]) -> str:
+    """Replace $KEY and ${KEY} in text when KEY exists in vars_map. Leave others unchanged."""
+    if not text or not vars_map:  # empty text or empty/None mapping: return the input untouched
+        return text
+    def repl_braced(m: re.Match) -> str:
+        key = m.group(1)  # KEY captured from "${KEY}"
+        return vars_map.get(key, m.group(0))  # unknown KEY: keep the matched text as-is
+    def repl_simple(m: re.Match) -> str:
+        key = m.group(1)  # KEY captured from "$KEY"
+        return vars_map.get(key, m.group(0))  # unknown KEY: keep the matched text as-is
+    # Replace ${KEY} first, then $KEY
+    text = re.sub(r"\$\{([A-Za-z_][A-Za-z0-9_]*)\}", repl_braced, text)
+    text = re.sub(r"\$([A-Za-z_][A-Za-z0-9_]*)", repl_simple, text)  # NOTE(review): runs on the first pass's output, so a "$NAME" inside a value inserted for "${KEY}" is expanded as well
+    return text
+def _parse_front_matter(text: str) -> Tuple[Optional[Dict[str, Any]], str]:
+    """Parse YAML front matter at the start of a prompt and return (meta, body)."""
+    try:
+        if not text.startswith("---\n"):  # front matter must open on the very first line
+            return None, text
+        end_idx = text.find("\n---", 4)  # first "\n---" at or after index 4 closes the block
+        if end_idx == -1:  # opening marker without a closing one: treat as no front matter
+            return None, text
+        fm_body = text[4:end_idx]  # YAML text between the two markers
+        rest = text[end_idx + len("\n---"):]  # everything after the closing marker
+        if rest.startswith("\n"):  # drop the single newline that directly follows the marker
+            rest = rest[1:]
+        import yaml as _yaml  # imported inside the try, so an ImportError is also caught below
+        meta = _yaml.safe_load(fm_body) or {}  # falsy parse result (e.g. empty YAML) becomes {}
+        if not isinstance(meta, dict):  # non-mapping YAML is replaced by an empty dict
+            meta = {}
+        return meta, rest
+    except Exception:  # any failure above falls back to "no front matter", returning the full text
+        return None, text
+def _is_architecture_template(meta: Optional[Dict[str, Any]]) -> bool:
+    """Detect the packaged architecture JSON template via its front matter name."""
+    return isinstance(meta, dict) and meta.get("name") == "architecture/architecture_json"  # None or non-dict meta gives False
+def _repair_architecture_interface_types(payload: Any) -> Tuple[Any, bool]:
+    """
+    Patch common LLM slip-ups for the architecture template where interface.type
+    occasionally returns an unsupported value like "object". Only normalizes the
+    interface.type field and leaves other schema issues untouched so validation
+    still fails for genuinely malformed outputs.
+    """
+    allowed_types = {
+        "component",
+        "page",
+        "module",
+        "api",
+        "graphql",
+        "cli",
+        "job",
+        "message",
+        "config",
+    }
+    changed = False  # becomes True once any interface["type"] is rewritten
+    if not isinstance(payload, list):  # only a top-level list is inspected
+        return payload, changed
+    for entry in payload:
+        if not isinstance(entry, dict):  # non-dict entries are left alone
+            continue
+        interface = entry.get("interface")
+        if not isinstance(interface, dict):  # missing or non-dict interface: nothing to repair
+            continue
+        raw_type = interface.get("type")
+        normalized = raw_type.lower() if isinstance(raw_type, str) else None  # None when type is absent or not a string
+        if normalized in allowed_types:
+            if normalized != raw_type:  # allowed value that differed only by letter case
+                interface["type"] = normalized
+                changed = True
+            continue
+        inferred_type = None
+        for key in ("page", "component", "module", "api", "graphql", "cli", "job", "message", "config"):  # first of these keys whose value is a dict wins
+            if isinstance(interface.get(key), dict):
+                inferred_type = key
+                break
+        if inferred_type is None:  # no such key present: default to "module"
+            inferred_type = "module"
+        if raw_type != inferred_type:
+            interface["type"] = inferred_type
+            changed = True
+    return payload, changed  # payload is modified in place and handed back
 def get_git_content_at_ref(file_path: str, git_ref: str = "HEAD") -> Optional[str]:
     """Gets the content of the file as it was at the specified git_ref."""
     abs_file_path = pathlib.Path(file_path).resolve()
@@ -124,6 +235,28 @@ def git_add_files(file_paths: List[str], verbose: bool = False) -> bool:
         return False
 # --- End Git Helper Functions ---
+def _find_default_test_files(tests_dir: Optional[str], code_file_path: Optional[str]) -> List[str]:
+    """Find default test files for a given code file in the tests directory."""
+    if not tests_dir or not code_file_path:  # either argument missing/empty: nothing to look for
+        return []
+    tests_path = pathlib.Path(tests_dir)
+    code_path = pathlib.Path(code_file_path)
+    if not tests_path.exists() or not tests_path.is_dir():  # tests_dir must be an existing directory
+        return []
+    code_stem = code_path.stem
+    code_suffix = code_path.suffix
+    # Look for files starting with test_{code_stem}
+    # We look for test_{code_stem}*.{code_suffix}
+    # e.g., hello.py -> test_hello.py, test_hello_1.py
+    pattern = f"test_{code_stem}*{code_suffix}"  # NOTE(review): prefix match, so hello.py would also pick up e.g. test_hello_world.py
+    found_files = list(tests_path.glob(pattern))  # pattern has no "**", so only direct children of tests_dir are matched
+    return [str(p) for p in sorted(found_files)]  # sorted paths, converted to strings
 def code_generator_main(
     ctx: click.Context,
@@ -131,6 +264,9 @@ def code_generator_main(
     output: Optional[str],
     original_prompt_file_path: Optional[str],
     force_incremental_flag: bool,
+    env_vars: Optional[Dict[str, str]] = None,
+    unit_test_file: Optional[str] = None,
+    exclude_tests: bool = False,
 ) -> Tuple[str, bool, float, str]:
     """
     CLI wrapper for generating code from prompts. Handles full and incremental generation,
@@ -157,20 +293,97 @@ def code_generator_main(
     command_options: Dict[str, Any] = {"output": output}
     try:
+        # Read prompt content once to determine LLM state and for construct_paths
+        with open(prompt_file, 'r', encoding='utf-8') as f:
+            raw_prompt_content = f.read()
+        # Phase-2 templates: parse front matter metadata
+        fm_meta, body = _parse_front_matter(raw_prompt_content)
+        if fm_meta:
+            prompt_content = body
+        else:
+            prompt_content = raw_prompt_content
+        # Determine LLM state early to avoid unnecessary overwrite prompts
+        llm_enabled: bool = True
+        env_llm_raw = None
+        try:
+            if env_vars and 'llm' in env_vars:
+                env_llm_raw = str(env_vars.get('llm'))
+            elif os.environ.get('llm') is not None:
+                env_llm_raw = os.environ.get('llm')
+            elif os.environ.get('LLM') is not None:
+                env_llm_raw = os.environ.get('LLM')
+        except Exception:
+            env_llm_raw = None
+        # Environment variables should override front matter
+        if env_llm_raw is not None:
+            llm_enabled = _parse_llm_bool(env_llm_raw)
+        elif fm_meta and isinstance(fm_meta, dict) and 'llm' in fm_meta:
+            llm_enabled = bool(fm_meta.get('llm', True))
+        # else: keep default True
+        # If LLM is disabled, we're only doing post-processing, so skip overwrite confirmation
+        effective_force = force_overwrite or not llm_enabled
         resolved_config, input_strings, output_file_paths, language = construct_paths(
             input_file_paths=input_file_paths_dict,
-            force=force_overwrite,
+            force=effective_force,
             quiet=quiet,
             command="generate",
             command_options=command_options,
+            context_override=ctx.obj.get('context'),
+            confirm_callback=cli_params.get('confirm_callback')
         )
-        prompt_content = input_strings["prompt_file"]
-        # Prioritize orchestration output path over construct_paths result
-        output_path = output or output_file_paths.get("output")
+        # Determine final output path: if user passed a directory, use resolved file path
+        resolved_output = output_file_paths.get("output")
+        if output is None:
+            output_path = resolved_output
+        else:
+            try:
+                is_dir_hint = output.endswith(os.path.sep) or output.endswith("/")
+            except Exception:
+                is_dir_hint = False
+            if is_dir_hint or os.path.isdir(output):
+                output_path = resolved_output
+            else:
+                output_path = output
+        # --- Unit Test Inclusion Logic ---
+        test_files_to_include: List[str] = []
+        if unit_test_file:
+            test_files_to_include.append(unit_test_file)
+        elif not exclude_tests:
+            # Try to find default test files
+            tests_dir = resolved_config.get("tests_dir")
+            found_tests = _find_default_test_files(tests_dir, output_path)
+            if found_tests:
+                if verbose:
+                    console.print(f"[info]Found default test files: {', '.join(found_tests)}[/info]")
+                test_files_to_include.extend(found_tests)
+        if test_files_to_include:
+            prompt_content += "\n\n<unit_test_content>\n"
+            prompt_content += "The following is the unit test content that the generated code must pass:\n"
+            for tf in test_files_to_include:
+                try:
+                    with open(tf, 'r', encoding='utf-8') as f:
+                        content = f.read()
+                    # If multiple files, label them? Or just concat?
+                    # Using code block with file path comment is safer for context.
+                    prompt_content += f"\nFile: {pathlib.Path(tf).name}\n```python\n{content}\n```\n"
+                except Exception as e:
+                    console.print(f"[yellow]Warning: Could not read unit test file {tf}: {e}[/yellow]")
+            prompt_content += "</unit_test_content>\n"
+        # ---------------------------------
     except FileNotFoundError as e:
         console.print(f"[red]Error: Input file not found: {e.filename}[/red]")
         return "", False, 0.0, "error"
+    except click.Abort:
+        # User cancelled - re-raise to stop the sync loop
+        raise
     except Exception as e:
         console.print(f"[red]Error during path construction: {e}[/red]")
         return "", False, 0.0, "error"
@@ -179,6 +392,108 @@ def code_generator_main(
     existing_code_content: Optional[str] = None
     original_prompt_content_for_incremental: Optional[str] = None
+    # Merge -e vars with front-matter defaults; validate required
+    if env_vars is None:
+        env_vars = {}
+    if fm_meta and isinstance(fm_meta.get("variables"), dict):
+        for k, spec in (fm_meta["variables"].items()):
+            if isinstance(spec, dict):
+                if k not in env_vars and "default" in spec:
+                    env_vars[k] = str(spec["default"])
+            # if scalar default allowed, ignore for now
+        missing = [k for k, spec in fm_meta["variables"].items() if isinstance(spec, dict) and spec.get("required") and k not in env_vars]
+        if missing:
+            console.print(f"[error]Missing required variables: {', '.join(missing)}")
+            return "", False, 0.0, "error"
+    # Execute optional discovery from front matter to populate env_vars without overriding explicit -e values
+    def _run_discovery(discover_cfg: Dict[str, Any]) -> Dict[str, str]:
+        results: Dict[str, str] = {}
+        try:
+            if not discover_cfg:
+                return results
+            enabled = discover_cfg.get("enabled", False)
+            if not enabled:
+                return results
+            root = discover_cfg.get("root", ".")
+            patterns = discover_cfg.get("patterns", []) or []
+            exclude = discover_cfg.get("exclude", []) or []
+            max_per = int(discover_cfg.get("max_per_pattern", 0) or 0)
+            max_total = int(discover_cfg.get("max_total", 0) or 0)
+            root_path = pathlib.Path(root).resolve()
+            seen: List[str] = []
+            def _match_one(patterns_list: List[str]) -> List[str]:
+                matches: List[str] = []
+                for pat in patterns_list:
+                    globbed = list(root_path.rglob(pat))
+                    for p in globbed:
+                        if any(p.match(ex) for ex in exclude):
+                            continue
+                        sp = str(p.resolve())
+                        if sp not in matches:
+                            matches.append(sp)
+                    if max_per and len(matches) >= max_per:
+                        matches = matches[:max_per]
+                        break
+                return matches
+            # If a mapping 'set' is provided, compute per-variable results
+            set_map = discover_cfg.get("set") or {}
+            if isinstance(set_map, dict) and set_map:
+                for var_name, spec in set_map.items():
+                    if var_name in env_vars:
+                        continue  # don't override explicit -e
+                    v_patterns = spec.get("patterns", []) if isinstance(spec, dict) else []
+                    v_exclude = spec.get("exclude", []) if isinstance(spec, dict) else []
+                    save_exclude = exclude
+                    try:
+                        if v_exclude:
+                            exclude = v_exclude
+                        matches = _match_one(v_patterns or patterns)
+                    finally:
+                        exclude = save_exclude
+                    if matches:
+                        results[var_name] = ",".join(matches)
+                        seen.extend(matches)
+            # Fallback: populate SCAN_FILES and SCAN metadata
+            if not results:
+                files = _match_one(patterns)
+                if max_total and len(files) > max_total:
+                    files = files[:max_total]
+                if files:
+                    results["SCAN_FILES"] = ",".join(files)
+            # Always set root/patterns helpers
+            if root:
+                results.setdefault("SCAN_ROOT", str(root_path))
+            if patterns:
+                results.setdefault("SCAN_PATTERNS", ",".join(patterns))
+        except Exception as e:
+            if verbose and not quiet:
+                console.print(f"[yellow]Discovery skipped due to error: {e}[/yellow]")
+        return results
+    if fm_meta and isinstance(fm_meta.get("discover"), dict):
+        discovered = _run_discovery(fm_meta.get("discover") or {})
+        for k, v in discovered.items():
+            if k not in env_vars:
+                env_vars[k] = v
+    # Expand variables in output path if provided
+    if output_path:
+        output_path = _expand_vars(output_path, env_vars)
+    # Honor front-matter output when CLI did not pass --output
+    if output is None and fm_meta and isinstance(fm_meta.get("output"), str):
+        try:
+            meta_out = _expand_vars(fm_meta["output"], env_vars)
+            if meta_out:
+                output_path = str(pathlib.Path(meta_out).resolve())
+        except Exception:
+            pass
+    # Honor front-matter language if provided (overrides detection for both local and cloud)
+    if fm_meta and isinstance(fm_meta.get("language"), str) and fm_meta.get("language"):
+        language = fm_meta.get("language")
     if output_path and pathlib.Path(output_path).exists():
         try:
             existing_code_content = pathlib.Path(output_path).read_text(encoding="utf-8")
@@ -303,7 +618,96 @@ def code_generator_main(
         can_attempt_incremental = False
     try:
-        if can_attempt_incremental and existing_code_content is not None and original_prompt_content_for_incremental is not None:
+        # Resolve post-process script from env/CLI override, then front matter, then sensible default per template
+        post_process_script: Optional[str] = None
+        prompt_body_for_script: str = prompt_content
+        if verbose:
+            console.print(f"[blue]LLM enabled:[/blue] {llm_enabled}")
+        try:
+            post_process_script = None
+            script_override = None
+            if env_vars:
+                script_override = env_vars.get('POST_PROCESS_PYTHON') or env_vars.get('post_process_python')
+            if not script_override:
+                script_override = os.environ.get('POST_PROCESS_PYTHON') or os.environ.get('post_process_python')
+            if script_override and str(script_override).strip():
+                expanded = _expand_vars(str(script_override), env_vars)
+                pkg_dir = pathlib.Path(__file__).parent.resolve()
+                repo_root = pathlib.Path.cwd().resolve()
+                repo_pdd_dir = (repo_root / 'pdd').resolve()
+                candidate = pathlib.Path(expanded)
+                if not candidate.is_absolute():
+                    # 1) As provided, relative to CWD
+                    as_is = (repo_root / candidate)
+                    # 2) Under repo pdd/
+                    under_repo_pdd = (repo_pdd_dir / candidate.name) if not as_is.exists() else as_is
+                    # 3) Under installed package dir
+                    under_pkg = (pkg_dir / candidate.name) if not as_is.exists() and not under_repo_pdd.exists() else as_is
+                    if as_is.exists():
+                        candidate = as_is
+                    elif under_repo_pdd.exists():
+                        candidate = under_repo_pdd
+                    elif under_pkg.exists():
+                        candidate = under_pkg
+                    else:
+                        candidate = as_is  # will fail later with not found
+                post_process_script = str(candidate.resolve())
+            elif fm_meta and isinstance(fm_meta, dict):
+                raw_script = fm_meta.get('post_process_python')
+                if isinstance(raw_script, str) and raw_script.strip():
+                    # Expand variables like $VAR and ${VAR}
+                    expanded = _expand_vars(raw_script, env_vars)
+                    pkg_dir = pathlib.Path(__file__).parent.resolve()
+                    repo_root = pathlib.Path.cwd().resolve()
+                    repo_pdd_dir = (repo_root / 'pdd').resolve()
+                    candidate = pathlib.Path(expanded)
+                    if not candidate.is_absolute():
+                        as_is = (repo_root / candidate)
+                        under_repo_pdd = (repo_pdd_dir / candidate.name) if not as_is.exists() else as_is
+                        under_pkg = (pkg_dir / candidate.name) if not as_is.exists() and not under_repo_pdd.exists() else as_is
+                        if as_is.exists():
+                            candidate = as_is
+                        elif under_repo_pdd.exists():
+                            candidate = under_repo_pdd
+                        elif under_pkg.exists():
+                            candidate = under_pkg
+                        else:
+                            candidate = as_is
+                    post_process_script = str(candidate.resolve())
+            # Fallback default: for architecture template, use built-in render_mermaid.py
+            if not post_process_script:
+                try:
+                    prompt_str = str(prompt_file)
+                    looks_like_arch_template = (
+                        (isinstance(prompt_file, str) and (
+                            prompt_str.endswith("architecture/architecture_json.prompt") or
+                            prompt_str.endswith("architecture/architecture_json") or
+                            "architecture_json.prompt" in prompt_str or
+                            "architecture/architecture_json" in prompt_str
+                        ))
+                    )
+                    looks_like_arch_output = (
+                        bool(output_path) and pathlib.Path(str(output_path)).name == 'architecture.json'
+                    )
+                    if looks_like_arch_template or looks_like_arch_output:
+                        pkg_dir = pathlib.Path(__file__).parent
+                        repo_pdd_dir = pathlib.Path.cwd() / 'pdd'
+                        if (pkg_dir / 'render_mermaid.py').exists():
+                            post_process_script = str((pkg_dir / 'render_mermaid.py').resolve())
+                        elif (repo_pdd_dir / 'render_mermaid.py').exists():
+                            post_process_script = str((repo_pdd_dir / 'render_mermaid.py').resolve())
+                except Exception:
+                    post_process_script = None
+            if verbose:
+                console.print(f"[blue]Post-process script resolved to:[/blue] {post_process_script if post_process_script else 'None'}")
+        except Exception:
+            post_process_script = None
+        # If LLM is disabled but no post-process script is provided, surface a helpful error
+        if not llm_enabled and not post_process_script:
+            console.print("[red]Error: llm: false requires 'post_process_python' to be specified in front matter.[/red]")
+            return "", was_incremental_operation, total_cost, "error"
+        if llm_enabled and can_attempt_incremental and existing_code_content is not None and original_prompt_content_for_incremental is not None:
             if verbose:
                 console.print(Panel("Attempting incremental code generation...", title="[blue]Mode[/blue]", expand=False))
@@ -326,9 +730,18 @@ def code_generator_main(
                 if files_to_stage_for_rollback:
                     git_add_files(files_to_stage_for_rollback, verbose=verbose)
+            # Preprocess both prompts: expand includes, substitute vars, then double
+            orig_proc = pdd_preprocess(original_prompt_content_for_incremental, recursive=True, double_curly_brackets=False)
+            orig_proc = _expand_vars(orig_proc, env_vars)
+            orig_proc = pdd_preprocess(orig_proc, recursive=False, double_curly_brackets=True)
+            new_proc = pdd_preprocess(prompt_content, recursive=True, double_curly_brackets=False)
+            new_proc = _expand_vars(new_proc, env_vars)
+            new_proc = pdd_preprocess(new_proc, recursive=False, double_curly_brackets=True)
             generated_code_content, was_incremental_operation, total_cost, model_name = incremental_code_generator_func(
-                original_prompt=original_prompt_content_for_incremental,
-                new_prompt=prompt_content,
+                original_prompt=orig_proc,
+                new_prompt=new_proc,
                 existing_code=existing_code_content,
                 language=language,
                 strength=strength,
@@ -336,7 +749,7 @@ def code_generator_main(
                 time=time_budget,
                 force_incremental=force_incremental_flag,
                 verbose=verbose,
-                preprocess_prompt=True
+                preprocess_prompt=False
             )
             if not was_incremental_operation:
@@ -345,7 +758,7 @@ def code_generator_main(
             elif verbose:
                 console.print(Panel(f"Incremental update successful. Model: {model_name}, Cost: ${total_cost:.6f}", title="[green]Incremental Success[/green]", expand=False))
-        if not was_incremental_operation: # Full generation path
+        if llm_enabled and not was_incremental_operation: # Full generation path
             if verbose:
                 console.print(Panel("Performing full code generation...", title="[blue]Mode[/blue]", expand=False))
@@ -353,8 +766,10 @@ def code_generator_main(
             if not current_execution_is_local:
                 if verbose: console.print("Attempting cloud code generation...")
-                processed_prompt_for_cloud = pdd_preprocess(prompt_content, recursive=True, double_curly_brackets=True, exclude_keys=[])
+                # Expand includes, substitute vars, then double
+                processed_prompt_for_cloud = pdd_preprocess(prompt_content, recursive=True, double_curly_brackets=False, exclude_keys=[])
+                processed_prompt_for_cloud = _expand_vars(processed_prompt_for_cloud, env_vars)
+                processed_prompt_for_cloud = pdd_preprocess(processed_prompt_for_cloud, recursive=False, double_curly_brackets=True, exclude_keys=[])
                 if verbose: console.print(Panel(Text(processed_prompt_for_cloud, overflow="fold"), title="[cyan]Preprocessed Prompt for Cloud[/cyan]", expand=False))
                 jwt_token: Optional[str] = None
@@ -389,7 +804,7 @@ def code_generator_main(
                         total_cost = float(response_data.get("totalCost", 0.0))
                         model_name = response_data.get("modelName", "cloud_model")
-                        if generated_code_content is None:
+                        if not generated_code_content:
                             console.print("[yellow]Cloud execution returned no code. Falling back to local.[/yellow]")
                             current_execution_is_local = True
                         elif verbose:
@@ -410,36 +825,268 @@ def code_generator_main(
             if current_execution_is_local:
                 if verbose: console.print("Executing code generator locally...")
+                # Expand includes, substitute vars, then double; pass to local generator with preprocess_prompt=False
+                local_prompt = pdd_preprocess(prompt_content, recursive=True, double_curly_brackets=False, exclude_keys=[])
+                local_prompt = _expand_vars(local_prompt, env_vars)
+                local_prompt = pdd_preprocess(local_prompt, recursive=False, double_curly_brackets=True, exclude_keys=[])
+                # Language already resolved (front matter overrides detection if present)
+                gen_language = language
+                # Extract output schema from front matter if available
+                output_schema = fm_meta.get("output_schema") if fm_meta else None
                 generated_code_content, total_cost, model_name = local_code_generator_func(
-                    prompt=prompt_content,
-                    language=language,
+                    prompt=local_prompt,
+                    language=gen_language,
                     strength=strength,
                     temperature=temperature,
                     time=time_budget,
                     verbose=verbose,
-                    preprocess_prompt=True
+                    preprocess_prompt=False,
+                    output_schema=output_schema,
                 )
                 was_incremental_operation = False
                 if verbose:
                     console.print(Panel(f"Full generation successful. Model: {model_name}, Cost: ${total_cost:.6f}", title="[green]Local Success[/green]", expand=False))
+        # Optional post-process Python hook (runs after LLM when enabled, or standalone when LLM is disabled)
+        if post_process_script:
+            try:
+                python_executable = detect_host_python_executable()
+                # Choose stdin for the script: LLM output if available and enabled, else prompt body
+                stdin_payload = generated_code_content if (llm_enabled and generated_code_content is not None) else prompt_body_for_script
+                env = os.environ.copy()
+                env['PDD_LANGUAGE'] = str(language or '')
+                env['PDD_OUTPUT_PATH'] = str(output_path or '')
+                env['PDD_PROMPT_FILE'] = str(pathlib.Path(prompt_file).resolve())
+                env['PDD_LLM'] = '1' if llm_enabled else '0'
+                try:
+                    env['PDD_ENV_VARS'] = json.dumps(env_vars or {})
+                except Exception:
+                    env['PDD_ENV_VARS'] = '{}'
+                # If front matter provides args, run in argv mode with a temp input file
+                fm_args = None
+                try:
+                    # Env/CLI override for args (comma-separated or JSON list)
+                    raw_args_env = None
+                    if env_vars:
+                        raw_args_env = env_vars.get('POST_PROCESS_ARGS') or env_vars.get('post_process_args')
+                    if not raw_args_env:
+                        raw_args_env = os.environ.get('POST_PROCESS_ARGS') or os.environ.get('post_process_args')
+                    if raw_args_env:
+                        s = str(raw_args_env).strip()
+                        parsed_list = None
+                        if s.startswith('[') and s.endswith(']'):
+                            try:
+                                parsed = json.loads(s)
+                                if isinstance(parsed, list):
+                                    parsed_list = [str(a) for a in parsed]
+                            except Exception:
+                                parsed_list = None
+                        if parsed_list is None:
+                            if ',' in s:
+                                parsed_list = [part.strip() for part in s.split(',') if part.strip()]
+                            else:
+                                parsed_list = [part for part in s.split() if part]
+                        fm_args = parsed_list or None
+                    if fm_args is None:
+                        raw_args = fm_meta.get('post_process_args') if isinstance(fm_meta, dict) else None
+                        if isinstance(raw_args, list):
+                            fm_args = [str(a) for a in raw_args]
+                except Exception:
+                    fm_args = None
+                proc = None
+                temp_input_path = None
+                try:
+                    if fm_args is None:
+                        # Provide sensible default args for architecture template with render_mermaid.py
+                        try:
+                            if post_process_script and pathlib.Path(post_process_script).name == 'render_mermaid.py':
+                                if isinstance(prompt_file, str) and prompt_file.endswith('architecture/architecture_json.prompt'):
+                                    fm_args = ["{INPUT_FILE}", "{APP_NAME}", "{OUTPUT_HTML}"]
+                        except Exception:
+                            pass
+                    if fm_args:
+                        # When LLM is disabled, use the existing output file instead of creating a temp file
+                        if not llm_enabled and output_path and pathlib.Path(output_path).exists():
+                            temp_input_path = str(pathlib.Path(output_path).resolve())
+                            env['PDD_POSTPROCESS_INPUT_FILE'] = temp_input_path
+                        else:
+                            # Write payload to a temp file for scripts expecting a file path input
+                            suffix = '.json' if (isinstance(language, str) and str(language).lower().strip() == 'json') or (output_path and str(output_path).lower().endswith('.json')) else '.txt'
+                            if output_path and llm_enabled:
+                                temp_input_path = str(pathlib.Path(output_path).resolve())
+                                pathlib.Path(temp_input_path).parent.mkdir(parents=True, exist_ok=True)
+                                with open(temp_input_path, 'w', encoding='utf-8') as f:
+                                    f.write(stdin_payload or '')
+                            else:
+                                with tempfile.NamedTemporaryFile(mode='w', delete=False, suffix=suffix, encoding='utf-8') as tf:
+                                    tf.write(stdin_payload or '')
+                                    temp_input_path = tf.name
+                            env['PDD_POSTPROCESS_INPUT_FILE'] = temp_input_path
+                        # Compute placeholder values
+                        app_name_val = (env_vars or {}).get('APP_NAME') if env_vars else None
+                        if not app_name_val:
+                            app_name_val = 'System Architecture'
+                        output_html_default = None
+                        if output_path and str(output_path).lower().endswith('.json'):
+                            output_html_default = str(pathlib.Path(output_path).with_name(f"{pathlib.Path(output_path).stem}_diagram.html").resolve())
+                        placeholder_map = {
+                            'INPUT_FILE': temp_input_path or '',
+                            'OUTPUT': str(output_path or ''),
+                            'PROMPT_FILE': str(pathlib.Path(prompt_file).resolve()),
+                            'APP_NAME': str(app_name_val),
+                            'OUTPUT_HTML': str(output_html_default or ''),
+                        }
+                        def _subst_arg(arg: str) -> str:
+                            # First expand $VARS using existing helper, then {TOKENS}
+                            expanded = _expand_vars(arg, env_vars)
+                            for key, val in placeholder_map.items():
+                                expanded = expanded.replace('{' + key + '}', val)
+                            return expanded
+                        args_list = [_subst_arg(a) for a in fm_args]
+                        if verbose:
+                            console.print(Panel(f"Post-process hook (argv)\nScript: {post_process_script}\nArgs: {args_list}", title="[blue]Post-process[/blue]", expand=False))
+                        proc = subprocess.run(
+                            [python_executable, post_process_script] + args_list,
+                            text=True,
+                            capture_output=True,
+                            timeout=300,
+                            cwd=str(pathlib.Path(post_process_script).parent),
+                            env=env
+                        )
+                    else:
+                        # Run the script with stdin payload, capture stdout as final content
+                        if verbose:
+                            console.print(Panel(f"Post-process hook (stdin)\nScript: {post_process_script}", title="[blue]Post-process[/blue]", expand=False))
+                        proc = subprocess.run(
+                            [python_executable, post_process_script],
+                            input=stdin_payload or '',
+                            text=True,
+                            capture_output=True,
+                            timeout=300,
+                            cwd=str(pathlib.Path(post_process_script).parent),
+                            env=env
+                        )
+                finally:
+                    if temp_input_path:
+                        try:
+                            # Only delete temp files, not the actual output file when llm=false
+                            if llm_enabled or not (output_path and pathlib.Path(output_path).exists() and temp_input_path == str(pathlib.Path(output_path).resolve())):
+                                os.unlink(temp_input_path)
+                        except Exception:
+                            pass
+                if proc and proc.returncode == 0:
+                    if verbose:
+                        console.print(Panel(f"Post-process success (rc=0)\nstdout: {proc.stdout[:150]}\nstderr: {proc.stderr[:150]}", title="[green]Post-process[/green]", expand=False))
+                    # Do not modify generated_code_content to preserve architecture.json
+                else:
+                    rc = getattr(proc, 'returncode', 'N/A')
+                    err = getattr(proc, 'stderr', '')
+                    console.print(f"[yellow]Post-process failed (rc={rc}). Stderr:\n{err[:500]}[/yellow]")
+            except FileNotFoundError:
+                console.print(f"[yellow]Post-process script not found: {post_process_script}. Skipping.[/yellow]")
+            except subprocess.TimeoutExpired:
+                console.print("[yellow]Post-process script timed out. Skipping.[/yellow]")
+            except Exception as e:
+                console.print(f"[yellow]Post-process script error: {e}. Skipping.[/yellow]")
         if generated_code_content is not None:
+            # Optional output_schema JSON validation before writing (only when LLM ran)
+            if llm_enabled:
+                try:
+                    if fm_meta and isinstance(fm_meta.get("output_schema"), dict):
+                        is_json_output = False
+                        if isinstance(language, str) and str(language).lower().strip() == "json":
+                            is_json_output = True
+                        elif output_path and str(output_path).lower().endswith(".json"):
+                            is_json_output = True
+                        if is_json_output:
+                            # Check if the generated content is an error message from llm_invoke
+                            if generated_code_content.strip().startswith("ERROR:"):
+                                raise click.UsageError(f"LLM generation failed: {generated_code_content}")
+                            parsed = json.loads(generated_code_content)
+                            if _is_architecture_template(fm_meta):
+                                parsed, repaired = _repair_architecture_interface_types(parsed)
+                                if repaired:
+                                    generated_code_content = json.dumps(parsed, indent=2)
+                            try:
+                                import jsonschema
+                                jsonschema.validate(instance=parsed, schema=fm_meta.get("output_schema"))
+                            except ModuleNotFoundError:
+                                if verbose and not quiet:
+                                    console.print("[yellow]jsonschema not installed; skipping schema validation.[/yellow]")
+                            except Exception as ve:
+                                raise click.UsageError(f"Generated JSON does not match output_schema: {ve}")
+                except json.JSONDecodeError as jde:
+                    raise click.UsageError(f"Generated output is not valid JSON: {jde}")
             if output_path:
                 p_output = pathlib.Path(output_path)
                 p_output.parent.mkdir(parents=True, exist_ok=True)
                 p_output.write_text(generated_code_content, encoding="utf-8")
                 if verbose or not quiet:
                     console.print(f"Generated code saved to: [green]{p_output.resolve()}[/green]")
-            elif not quiet: # No output path, print to console if not quiet
-                console.print(Panel(Text(generated_code_content, overflow="fold"), title="[cyan]Generated Code[/cyan]", expand=True))
+                # Safety net: ensure architecture HTML is generated post-write if applicable
+                try:
+                    # Prefer resolved script if available; else default for architecture outputs
+                    script_path2 = post_process_script
+                    if not script_path2:
+                        looks_like_arch_output2 = pathlib.Path(str(p_output)).name == 'architecture.json'
+                        if looks_like_arch_output2:
+                            pkg_dir2 = pathlib.Path(__file__).parent
+                            repo_pdd_dir2 = pathlib.Path.cwd() / 'pdd'
+                            if (pkg_dir2 / 'render_mermaid.py').exists():
+                                script_path2 = str((pkg_dir2 / 'render_mermaid.py').resolve())
+                            elif (repo_pdd_dir2 / 'render_mermaid.py').exists():
+                                script_path2 = str((repo_pdd_dir2 / 'render_mermaid.py').resolve())
+                    if script_path2 and pathlib.Path(script_path2).exists():
+                        app_name2 = os.environ.get('APP_NAME') or (env_vars or {}).get('APP_NAME') or 'System Architecture'
+                        out_html2 = os.environ.get('POST_PROCESS_OUTPUT') or str(p_output.with_name(f"{p_output.stem}_diagram.html").resolve())
+                        html_missing = not pathlib.Path(out_html2).exists()
+                        always_run_for_arch = pathlib.Path(str(p_output)).name == 'architecture.json'
+                        if always_run_for_arch or html_missing:
+                            try:
+                                py_exec2 = detect_host_python_executable()
+                            except Exception:
+                                py_exec2 = sys.executable
+                            if verbose:
+                                console.print(Panel(f"Safety net post-process\nScript: {script_path2}\nArgs: {[str(p_output.resolve()), app_name2, out_html2]}", title="[blue]Post-process[/blue]", expand=False))
+                            sp2 = subprocess.run([py_exec2, script_path2, str(p_output.resolve()), app_name2, out_html2],
+                                                 capture_output=True, text=True, cwd=str(pathlib.Path(script_path2).parent))
+                            if sp2.returncode == 0 and not quiet:
+                                print(f"✅ Generated: {out_html2}")
+                            elif verbose:
+                                console.print(f"[yellow]Safety net failed (rc={sp2.returncode}). stderr:\n{sp2.stderr[:300]}[/yellow]")
+                except Exception:
+                    pass
+                # Post-step now runs regardless of LLM value via the general post-process hook above.
+            elif not quiet:
+                # No destination resolved; surface the generated code directly to the console.
+                console.print(Panel(Text(generated_code_content, overflow="fold"), title="[cyan]Generated Code[/cyan]", expand=False))
+                console.print("[yellow]No output path resolved; skipping file write and stdout print.[/yellow]")
         else:
-            console.print("[red]Error: Code generation failed. No code was produced.[/red]")
-            return "", was_incremental_operation, total_cost, model_name or "error"
+            # If LLM was disabled and post-process ran, that's a success (no error)
+            if not llm_enabled and post_process_script:
+                if verbose or not quiet:
+                    console.print("[green]Post-process completed successfully (LLM was disabled).[/green]")
+            else:
+                console.print("[red]Error: Code generation failed. No code was produced.[/red]")
+                return "", was_incremental_operation, total_cost, model_name or "error"
+    except click.Abort:
+        # User cancelled - re-raise to stop the sync loop
+        raise
     except Exception as e:
-        console.print(f"[red]An unexpected error occurred: {e}[/red]")
-        import traceback
-        if verbose: console.print(traceback.format_exc())
-        return "", was_incremental_operation, total_cost, "error"
+        if isinstance(e, click.UsageError):
+            raise
+        # For any other unexpected error, we should fail hard so the CLI exits non-zero
+        # Log the detailed traceback first if verbose
+        if verbose:
+            import traceback
+            console.print(traceback.format_exc())
+        raise click.UsageError(f"An unexpected error occurred: {e}")
-    return generated_code_content or "", was_incremental_operation, total_cost, model_name
+    return generated_code_content or "", was_incremental_operation, total_cost, model_name

pdd-cli 0.0.42__py3-none-any.whl → 0.0.90__py3-none-any.whl

pdd-cli 0.0.42__py3-none-any.whl → 0.0.90__py3-none-any.whl