pdd-cli 0.0.45__py3-none-any.whl → 0.0.118__py3-none-any.whl

This diff shows the contents of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in the public registry.
Files changed (195)
  1. pdd/__init__.py +40 -8
  2. pdd/agentic_bug.py +323 -0
  3. pdd/agentic_bug_orchestrator.py +497 -0
  4. pdd/agentic_change.py +231 -0
  5. pdd/agentic_change_orchestrator.py +526 -0
  6. pdd/agentic_common.py +598 -0
  7. pdd/agentic_crash.py +534 -0
  8. pdd/agentic_e2e_fix.py +319 -0
  9. pdd/agentic_e2e_fix_orchestrator.py +426 -0
  10. pdd/agentic_fix.py +1294 -0
  11. pdd/agentic_langtest.py +162 -0
  12. pdd/agentic_update.py +387 -0
  13. pdd/agentic_verify.py +183 -0
  14. pdd/architecture_sync.py +565 -0
  15. pdd/auth_service.py +210 -0
  16. pdd/auto_deps_main.py +71 -51
  17. pdd/auto_include.py +245 -5
  18. pdd/auto_update.py +125 -47
  19. pdd/bug_main.py +196 -23
  20. pdd/bug_to_unit_test.py +2 -0
  21. pdd/change_main.py +11 -4
  22. pdd/cli.py +22 -1181
  23. pdd/cmd_test_main.py +350 -150
  24. pdd/code_generator.py +60 -18
  25. pdd/code_generator_main.py +790 -57
  26. pdd/commands/__init__.py +48 -0
  27. pdd/commands/analysis.py +306 -0
  28. pdd/commands/auth.py +309 -0
  29. pdd/commands/connect.py +290 -0
  30. pdd/commands/fix.py +163 -0
  31. pdd/commands/generate.py +257 -0
  32. pdd/commands/maintenance.py +175 -0
  33. pdd/commands/misc.py +87 -0
  34. pdd/commands/modify.py +256 -0
  35. pdd/commands/report.py +144 -0
  36. pdd/commands/sessions.py +284 -0
  37. pdd/commands/templates.py +215 -0
  38. pdd/commands/utility.py +110 -0
  39. pdd/config_resolution.py +58 -0
  40. pdd/conflicts_main.py +8 -3
  41. pdd/construct_paths.py +589 -111
  42. pdd/context_generator.py +10 -2
  43. pdd/context_generator_main.py +175 -76
  44. pdd/continue_generation.py +53 -10
  45. pdd/core/__init__.py +33 -0
  46. pdd/core/cli.py +527 -0
  47. pdd/core/cloud.py +237 -0
  48. pdd/core/dump.py +554 -0
  49. pdd/core/errors.py +67 -0
  50. pdd/core/remote_session.py +61 -0
  51. pdd/core/utils.py +90 -0
  52. pdd/crash_main.py +262 -33
  53. pdd/data/language_format.csv +71 -63
  54. pdd/data/llm_model.csv +20 -18
  55. pdd/detect_change_main.py +5 -4
  56. pdd/docs/prompting_guide.md +864 -0
  57. pdd/docs/whitepaper_with_benchmarks/data_and_functions/benchmark_analysis.py +495 -0
  58. pdd/docs/whitepaper_with_benchmarks/data_and_functions/creation_compare.py +528 -0
  59. pdd/fix_code_loop.py +523 -95
  60. pdd/fix_code_module_errors.py +6 -2
  61. pdd/fix_error_loop.py +491 -92
  62. pdd/fix_errors_from_unit_tests.py +4 -3
  63. pdd/fix_main.py +278 -21
  64. pdd/fix_verification_errors.py +12 -100
  65. pdd/fix_verification_errors_loop.py +529 -286
  66. pdd/fix_verification_main.py +294 -89
  67. pdd/frontend/dist/assets/index-B5DZHykP.css +1 -0
  68. pdd/frontend/dist/assets/index-DQ3wkeQ2.js +449 -0
  69. pdd/frontend/dist/index.html +376 -0
  70. pdd/frontend/dist/logo.svg +33 -0
  71. pdd/generate_output_paths.py +139 -15
  72. pdd/generate_test.py +218 -146
  73. pdd/get_comment.py +19 -44
  74. pdd/get_extension.py +8 -9
  75. pdd/get_jwt_token.py +318 -22
  76. pdd/get_language.py +8 -7
  77. pdd/get_run_command.py +75 -0
  78. pdd/get_test_command.py +68 -0
  79. pdd/git_update.py +70 -19
  80. pdd/incremental_code_generator.py +2 -2
  81. pdd/insert_includes.py +13 -4
  82. pdd/llm_invoke.py +1711 -181
  83. pdd/load_prompt_template.py +19 -12
  84. pdd/path_resolution.py +140 -0
  85. pdd/pdd_completion.fish +25 -2
  86. pdd/pdd_completion.sh +30 -4
  87. pdd/pdd_completion.zsh +79 -4
  88. pdd/postprocess.py +14 -4
  89. pdd/preprocess.py +293 -24
  90. pdd/preprocess_main.py +41 -6
  91. pdd/prompts/agentic_bug_step10_pr_LLM.prompt +182 -0
  92. pdd/prompts/agentic_bug_step1_duplicate_LLM.prompt +73 -0
  93. pdd/prompts/agentic_bug_step2_docs_LLM.prompt +129 -0
  94. pdd/prompts/agentic_bug_step3_triage_LLM.prompt +95 -0
  95. pdd/prompts/agentic_bug_step4_reproduce_LLM.prompt +97 -0
  96. pdd/prompts/agentic_bug_step5_root_cause_LLM.prompt +123 -0
  97. pdd/prompts/agentic_bug_step6_test_plan_LLM.prompt +107 -0
  98. pdd/prompts/agentic_bug_step7_generate_LLM.prompt +172 -0
  99. pdd/prompts/agentic_bug_step8_verify_LLM.prompt +119 -0
  100. pdd/prompts/agentic_bug_step9_e2e_test_LLM.prompt +289 -0
  101. pdd/prompts/agentic_change_step10_identify_issues_LLM.prompt +1006 -0
  102. pdd/prompts/agentic_change_step11_fix_issues_LLM.prompt +984 -0
  103. pdd/prompts/agentic_change_step12_create_pr_LLM.prompt +131 -0
  104. pdd/prompts/agentic_change_step1_duplicate_LLM.prompt +73 -0
  105. pdd/prompts/agentic_change_step2_docs_LLM.prompt +101 -0
  106. pdd/prompts/agentic_change_step3_research_LLM.prompt +126 -0
  107. pdd/prompts/agentic_change_step4_clarify_LLM.prompt +164 -0
  108. pdd/prompts/agentic_change_step5_docs_change_LLM.prompt +981 -0
  109. pdd/prompts/agentic_change_step6_devunits_LLM.prompt +1005 -0
  110. pdd/prompts/agentic_change_step7_architecture_LLM.prompt +1044 -0
  111. pdd/prompts/agentic_change_step8_analyze_LLM.prompt +1027 -0
  112. pdd/prompts/agentic_change_step9_implement_LLM.prompt +1077 -0
  113. pdd/prompts/agentic_crash_explore_LLM.prompt +49 -0
  114. pdd/prompts/agentic_e2e_fix_step1_unit_tests_LLM.prompt +90 -0
  115. pdd/prompts/agentic_e2e_fix_step2_e2e_tests_LLM.prompt +91 -0
  116. pdd/prompts/agentic_e2e_fix_step3_root_cause_LLM.prompt +89 -0
  117. pdd/prompts/agentic_e2e_fix_step4_fix_e2e_tests_LLM.prompt +96 -0
  118. pdd/prompts/agentic_e2e_fix_step5_identify_devunits_LLM.prompt +91 -0
  119. pdd/prompts/agentic_e2e_fix_step6_create_unit_tests_LLM.prompt +106 -0
  120. pdd/prompts/agentic_e2e_fix_step7_verify_tests_LLM.prompt +116 -0
  121. pdd/prompts/agentic_e2e_fix_step8_run_pdd_fix_LLM.prompt +120 -0
  122. pdd/prompts/agentic_e2e_fix_step9_verify_all_LLM.prompt +146 -0
  123. pdd/prompts/agentic_fix_explore_LLM.prompt +45 -0
  124. pdd/prompts/agentic_fix_harvest_only_LLM.prompt +48 -0
  125. pdd/prompts/agentic_fix_primary_LLM.prompt +85 -0
  126. pdd/prompts/agentic_update_LLM.prompt +925 -0
  127. pdd/prompts/agentic_verify_explore_LLM.prompt +45 -0
  128. pdd/prompts/auto_include_LLM.prompt +122 -905
  129. pdd/prompts/change_LLM.prompt +3093 -1
  130. pdd/prompts/detect_change_LLM.prompt +686 -27
  131. pdd/prompts/example_generator_LLM.prompt +22 -1
  132. pdd/prompts/extract_code_LLM.prompt +5 -1
  133. pdd/prompts/extract_program_code_fix_LLM.prompt +7 -1
  134. pdd/prompts/extract_prompt_update_LLM.prompt +7 -8
  135. pdd/prompts/extract_promptline_LLM.prompt +17 -11
  136. pdd/prompts/find_verification_errors_LLM.prompt +6 -0
  137. pdd/prompts/fix_code_module_errors_LLM.prompt +12 -2
  138. pdd/prompts/fix_errors_from_unit_tests_LLM.prompt +9 -0
  139. pdd/prompts/fix_verification_errors_LLM.prompt +22 -0
  140. pdd/prompts/generate_test_LLM.prompt +41 -7
  141. pdd/prompts/generate_test_from_example_LLM.prompt +115 -0
  142. pdd/prompts/increase_tests_LLM.prompt +1 -5
  143. pdd/prompts/insert_includes_LLM.prompt +316 -186
  144. pdd/prompts/prompt_code_diff_LLM.prompt +119 -0
  145. pdd/prompts/prompt_diff_LLM.prompt +82 -0
  146. pdd/prompts/trace_LLM.prompt +25 -22
  147. pdd/prompts/unfinished_prompt_LLM.prompt +85 -1
  148. pdd/prompts/update_prompt_LLM.prompt +22 -1
  149. pdd/pytest_output.py +127 -12
  150. pdd/remote_session.py +876 -0
  151. pdd/render_mermaid.py +236 -0
  152. pdd/server/__init__.py +52 -0
  153. pdd/server/app.py +335 -0
  154. pdd/server/click_executor.py +587 -0
  155. pdd/server/executor.py +338 -0
  156. pdd/server/jobs.py +661 -0
  157. pdd/server/models.py +241 -0
  158. pdd/server/routes/__init__.py +31 -0
  159. pdd/server/routes/architecture.py +451 -0
  160. pdd/server/routes/auth.py +364 -0
  161. pdd/server/routes/commands.py +929 -0
  162. pdd/server/routes/config.py +42 -0
  163. pdd/server/routes/files.py +603 -0
  164. pdd/server/routes/prompts.py +1322 -0
  165. pdd/server/routes/websocket.py +473 -0
  166. pdd/server/security.py +243 -0
  167. pdd/server/terminal_spawner.py +209 -0
  168. pdd/server/token_counter.py +222 -0
  169. pdd/setup_tool.py +648 -0
  170. pdd/simple_math.py +2 -0
  171. pdd/split_main.py +3 -2
  172. pdd/summarize_directory.py +237 -195
  173. pdd/sync_animation.py +8 -4
  174. pdd/sync_determine_operation.py +839 -112
  175. pdd/sync_main.py +351 -57
  176. pdd/sync_orchestration.py +1400 -756
  177. pdd/sync_tui.py +848 -0
  178. pdd/template_expander.py +161 -0
  179. pdd/template_registry.py +264 -0
  180. pdd/templates/architecture/architecture_json.prompt +237 -0
  181. pdd/templates/generic/generate_prompt.prompt +174 -0
  182. pdd/trace.py +168 -12
  183. pdd/trace_main.py +4 -3
  184. pdd/track_cost.py +140 -63
  185. pdd/unfinished_prompt.py +51 -4
  186. pdd/update_main.py +567 -67
  187. pdd/update_model_costs.py +2 -2
  188. pdd/update_prompt.py +19 -4
  189. {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/METADATA +29 -11
  190. pdd_cli-0.0.118.dist-info/RECORD +227 -0
  191. {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/licenses/LICENSE +1 -1
  192. pdd_cli-0.0.45.dist-info/RECORD +0 -116
  193. {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/WHEEL +0 -0
  194. {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/entry_points.txt +0 -0
  195. {pdd_cli-0.0.45.dist-info → pdd_cli-0.0.118.dist-info}/top_level.txt +0 -0
pdd/templates/generic/generate_prompt.prompt ADDED
@@ -0,0 +1,174 @@
+ ---
+ name: generic/generate_prompt
+ description: Generate a module prompt (.prompt) for any stack (backend, frontend, CLI, jobs) using project docs and context
+ version: 1.0.0
+ tags: [template, prompt, generic]
+ language: prompt
+ output: prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt
+ variables:
+   MODULE:
+     required: true
+     type: string
+     description: Module/component basename to generate a prompt for.
+     examples: [orders, auth, users]
+   LANG_OR_FRAMEWORK:
+     required: false
+     type: string
+     description: Target language or framework suffix used in prompt naming (matches your stack conventions).
+     examples: [Python, TypeScriptReact, Go, Java, Ruby]
+     default: Python
+   LAYER:
+     required: false
+     type: string
+     description: System layer or interface type for context.
+     examples: [backend, frontend, api, graphql, cli, job, message, config, module, component, page]
+   PRD_FILE:
+     required: false
+     type: path
+     description: Product requirements document providing overall context.
+     example_paths: [PRD.md, docs/product/prd.md]
+   API_DOC_FILE:
+     required: false
+     type: path
+     description: API documentation describing endpoints and conventions.
+     example_paths: [docs/api-documentation.md, docs/api.md]
+   DB_SCHEMA_FILE:
+     required: false
+     type: path
+     description: Database schema or ERD for backend data models.
+     example_paths: [context/database-schema.md, docs/db/schema.md]
+   BACKEND_FILES_CSV:
+     required: false
+     type: path
+     description: CSV listing backend Python files/modules (for context/reference).
+     example_paths: [prompts/backend/python_architecture.csv]
+   IO_DEPENDENCIES_CSV:
+     required: false
+     type: path
+     description: CSV of function inputs/outputs and dependencies for backend modules.
+     example_paths: [prompts/backend/io_dependencies.csv]
+   ARCHITECTURE_FILE:
+     required: true
+     type: path
+     description: Architecture JSON (from architecture/architecture_json) to drive module scope, dependencies, and interface.
+     example_paths: [architecture.json]
+   TECH_STACK_FILE:
+     required: false
+     type: path
+     description: Tech stack overview (languages, frameworks, infrastructure, tools) for shaping conventions.
+     example_paths: [docs/tech_stack.md, docs/architecture/stack.md]
+   CODE_GENERATOR_PROMPT:
+     required: false
+     type: path
+     description: Reference code generator prompt to mirror style and expectations.
+     example_paths: [prompts/code_generator_python.prompt, prompts/code_generator_main_python.prompt]
+   EXISTING_PROMPTS:
+     required: false
+     type: list
+     description: Existing prompt files to use as reference (comma/newline-separated).
+     example_paths: [prompts/orders_python.prompt, prompts/auth_python.prompt]
+   DEP_EXAMPLE_EXT:
+     required: false
+     type: string
+     description: File extension for dependency examples under context/ (for non-Python stacks).
+     examples: [py, ts, tsx, go, java]
+     default: py
+ usage:
+   generate:
+     - name: Minimal (architecture only)
+       command: pdd generate --template generic/generate_prompt -e MODULE=orders -e LANG_OR_FRAMEWORK=Python -e ARCHITECTURE_FILE=architecture.json --output 'prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt'
+     - name: With project docs
+       command: pdd generate --template generic/generate_prompt -e MODULE=orders -e LANG_OR_FRAMEWORK=Python -e ARCHITECTURE_FILE=architecture.json -e PRD_FILE=docs/PRD.md -e API_DOC_FILE=docs/api-documentation.md -e DB_SCHEMA_FILE=context/database-schema.md --output 'prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt'
+     - name: With CSVs and references (backend/Python)
+       command: pdd generate --template generic/generate_prompt -e MODULE=orders -e LANG_OR_FRAMEWORK=Python -e ARCHITECTURE_FILE=architecture.json -e PRD_FILE=docs/PRD.md -e API_DOC_FILE=docs/api-documentation.md -e DB_SCHEMA_FILE=context/database-schema.md -e BACKEND_FILES_CSV=prompts/backend/python_architecture.csv -e IO_DEPENDENCIES_CSV=prompts/backend/io_dependencies.csv -e CODE_GENERATOR_PROMPT=prompts/code_generator_python.prompt --output 'prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt'
+     - name: Frontend (TypeScriptReact) variant
+       command: pdd generate --template generic/generate_prompt -e MODULE=profile_page -e LANG_OR_FRAMEWORK=TypeScriptReact -e LAYER=frontend -e ARCHITECTURE_FILE=architecture.json -e PRD_FILE=docs/PRD.md --output 'prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt'
+     - name: From architecture.json
+       command: pdd generate --template generic/generate_prompt -e MODULE=orders_api -e LANG_OR_FRAMEWORK=Python -e LAYER=api -e ARCHITECTURE_FILE=architecture.json --output 'prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt'
+
+ discover:
+   enabled: false
+   max_per_pattern: 5
+   max_total: 10
+ ---
+
+ % You are an expert prompt writer and software architect for PDD. Your goal is to write a high-quality prompt that will generate the code for the ${MODULE} module/component. The prompt you create will be used to produce a detailed implementation specification in a file named ${MODULE}_${LANG_OR_FRAMEWORK}.prompt, suitable for the specified stack and layer.
+
+ IMPORTANT: Your reply MUST begin with `<prompt>` on the very first line and end with `</prompt>` on the final line. Do not include any text, whitespace, or code fences outside this block.
+
+ % Project context (architecture required, others optional):
+ <prd><include>${PRD_FILE}</include></prd>
+ <api><include>${API_DOC_FILE}</include></api>
+ <database><include>${DB_SCHEMA_FILE}</include></database>
+ <backend_files_csv><include>${BACKEND_FILES_CSV}</include></backend_files_csv>
+ <io_dependencies_csv><include>${IO_DEPENDENCIES_CSV}</include></io_dependencies_csv>
+ <architecture><include>${ARCHITECTURE_FILE}</include></architecture>
+ <tech_stack><include>${TECH_STACK_FILE}</include></tech_stack>
+ <generate_code_cli_example><include>${CODE_GENERATOR_PROMPT}</include></generate_code_cli_example>
+
+ % Existing prompt references (optional):
+ <existing_backend_prompts><include-many>${EXISTING_PROMPTS}</include-many></existing_backend_prompts>
+
+ % Do the following:
+ - Explain concisely what you are going to do (create a prompt for the ${MODULE} module/component for the specified layer and stack).
+ - Analyze any difficulties this prompt might encounter for ${MODULE} (e.g., data modeling, API or UI contracts, transactions, idempotency, auth, state management, error handling) and briefly state mitigation strategies tailored to the given LAYER and LANG_OR_FRAMEWORK.
+ - Use the ARCHITECTURE_FILE to identify the item that corresponds to this prompt by matching `filename` to `${MODULE}_${LANG_OR_FRAMEWORK}.prompt` (or best match by basename and layer). Use that item’s `reason`, `description`, `dependencies`, `interface`, and `tags` to shape the sections below.
+ - Then create the prompt content for ${MODULE} inside XML tags named prompt, ensuring conventions fit the stack and layer.
+ - Ensure the final response consists solely of the `<prompt>...</prompt>` block; nothing else (including whitespace) may appear before `<prompt>` or after `</prompt>`.
+
+ % The prompt you generate must follow this structure:
+ 1) First paragraph: describe the role and responsibility of the ${MODULE} module/component within the system (consider the LAYER if provided).
+ 2) A "Requirements" section with numbered points covering functionality, contracts, error handling, validation, logging, performance, and security.
+ 3) A "Dependencies" section using XML include tags for each dependency (see format below).
+ 4) An "Instructions" section with precise implementation guidance (clarify inputs/outputs, function/class responsibilities, edge cases, and testing notes).
+ 5) A clear "Deliverable" section describing the expected code artifacts and entry points.
+
+ % Dependencies format and conventions:
+ - Represent each dependency using an XML tag with the dependency name, and put the file path inside an <include> tag, e.g.:
+   <orders_service>
+     <include>context/orders_service_example.${DEP_EXAMPLE_EXT}</include>
+   </orders_service>
+ - Prefer real example files available in the provided context (use <include-many> when listing multiple). If examples are not provided, assume dependency examples live under context/ using the pattern context/[dependency_name]_example.${DEP_EXAMPLE_EXT}.
+ - Include all necessary dependencies for the module/component (based on the provided context and references).
+ - The ARCHITECTURE_FILE lists `dependencies` referencing other prompt filenames. Convert each dependency prompt filename into a sensible dependency name (strip language suffix and `_prompt`), and map to context files with the `${DEP_EXAMPLE_EXT}` extension if present; otherwise, list the prompt filename explicitly in a "Prompt Dependencies" subsection.
+
+ % Architecture awareness (ARCHITECTURE_FILE is required):
+ - Align the "Requirements" and "Instructions" with the selected item’s `interface.type` (e.g., page, component, module, api, graphql, cli, job, message, config).
+ - For `api`, outline endpoints (method, path, auth) consistent with the architecture description; for `page`/`component`, describe route/props/data sources; for `job`, include trigger and retry policy; for `config`, list keys and sources.
+
+ % Style and quality requirements:
+ - The generated prompt must be detailed enough to yield production-ready code.
+ - Match the style and patterns of existing *_${LANG_OR_FRAMEWORK}.prompt files when present.
+ - Do not invent technologies or files; rely on the included context. If assumptions are necessary, state them explicitly and conservatively.
+
+ % Output contract:
+ - Start the output with `<prompt>` on its own line and end with `</prompt>` on its own line.
+ - Do not emit any characters (including whitespace, markdown fences, or commentary) outside the `<prompt>...</prompt>` block.
+ - Within the tags, include the sections described above as plain text.
+ - OUTPUT FORMAT (authoritative – copy/paste and replace the bracketed placeholders, keeping every literal token):
+ ```text
+ <prompt>
+ {ROLE_PARAGRAPH}
+ Requirements
+ 1. {REQ_ITEM_1}
+ 2. {REQ_ITEM_2}
+ Dependencies
+ <{DEPENDENCY_TAG_1}>
+   <include>{DEPENDENCY_INCLUDE_1}</include>
+ </{DEPENDENCY_TAG_1}>
+ {OPTIONAL_ADDITIONAL_DEPENDENCY_TAGS}
+ Prompt Dependencies:
+ {PROMPT_DEPENDENCIES_SECTION}
+ Instructions
+ - {INSTRUCTION_1}
+ - {INSTRUCTION_2}
+ Deliverable
+ - {DELIVERABLE_1}
+ - {DELIVERABLE_2}
+ Implementation assumptions (explicit)
+ - {ASSUMPTION_1}
+ - {ASSUMPTION_2}
+ Please produce production-ready prompt content that will generate the module consistent with the above.
+ </prompt>
+ ```
+ Replace each `{PLACEHOLDER}` with concrete content while preserving the surrounding structure and literal `<prompt>` / `<include>` tags.
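As a rough mental model of how a template like this is consumed: `${VAR}` placeholders are substituted and `<include>` tags pull in file contents. The sketch below illustrates that expansion model only; it is an assumption for illustration, not pdd's actual template engine (the real implementation lives in `pdd/template_expander.py` and `pdd/template_registry.py` in the file list above and may differ).

```python
# Minimal sketch of the expansion model implied by the template above:
# substitute ${VAR} placeholders, then inline <include>path</include> tags.
# Illustrative only; pdd's real template engine may work differently.
import re
from pathlib import Path
from string import Template


def expand_template(text: str, variables: dict[str, str]) -> str:
    # Substitute ${MODULE}, ${LANG_OR_FRAMEWORK}, etc.; unknown variables stay as-is.
    substituted = Template(text).safe_substitute(variables)

    # Replace <include>path</include> with the file's contents; keep the tag if missing.
    def inline(match: re.Match) -> str:
        path = Path(match.group(1).strip())
        return path.read_text() if path.is_file() else match.group(0)

    return re.sub(r"<include>(.*?)</include>", inline, substituted, flags=re.DOTALL)


# Example: the output path convention used by this template.
variables = {"MODULE": "orders", "LANG_OR_FRAMEWORK": "Python"}
print(Template("prompts/${MODULE}_${LANG_OR_FRAMEWORK}.prompt").safe_substitute(variables))
# -> prompts/orders_Python.prompt
```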
pdd/trace.py CHANGED
@@ -1,14 +1,48 @@
- from typing import Tuple, Optional
+ from typing import Tuple, Optional, List
  from rich import print
  from rich.console import Console
  from pydantic import BaseModel, Field
  import difflib
+ import re
  from .load_prompt_template import load_prompt_template
  from .preprocess import preprocess
  from .llm_invoke import llm_invoke
  from . import DEFAULT_TIME, DEFAULT_STRENGTH
  console = Console()

+
+ def _normalize_text(value: str) -> str:
+     if value is None:
+         return ""
+     value = value.replace("\u201c", '"').replace("\u201d", '"')
+     value = value.replace("\u2018", "'").replace("\u2019", "'")
+     value = value.replace("\u00A0", " ")
+     value = re.sub(r"\s+", " ", value.strip())
+     return value
+
+
+ def _fallback_prompt_line(prompt_lines: List[str], code_str: str) -> int:
+     """Best-effort deterministic fallback to select a prompt line."""
+     normalized_code = _normalize_text(code_str).casefold()
+     tokens = [tok for tok in re.split(r"\W+", normalized_code) if len(tok) >= 3]
+
+     token_best_idx: Optional[int] = None
+     token_best_hits = 0
+     if tokens:
+         for i, line in enumerate(prompt_lines, 1):
+             normalized_line = _normalize_text(line).casefold()
+             hits = sum(1 for tok in tokens if tok in normalized_line)
+             if hits > token_best_hits:
+                 token_best_hits = hits
+                 token_best_idx = i
+     if token_best_idx is not None and token_best_hits > 0:
+         return token_best_idx
+
+     for i, line in enumerate(prompt_lines, 1):
+         if _normalize_text(line):
+             return i
+     return 1
+
  class PromptLineOutput(BaseModel):
      prompt_line: str = Field(description="The line from the prompt file that matches the code")

@@ -102,38 +136,160 @@ def trace(
          # Step 7: Find matching line in prompt file using fuzzy matching
          prompt_lines = prompt_file.splitlines()
          best_match = None
-         highest_ratio = 0
+         highest_ratio = 0.0

          if verbose:
              console.print(f"Searching for line: {prompt_line_str}")

-         normalized_search = prompt_line_str.strip()
+         # Robust normalization for comparison
+         # If the model echoed wrapper tags like <llm_output>...</llm_output>, extract inner text
+         raw_search = prompt_line_str
+         try:
+             m = re.search(r"<\s*llm_output\s*>(.*?)<\s*/\s*llm_output\s*>", raw_search, flags=re.IGNORECASE | re.DOTALL)
+             if m:
+                 raw_search = m.group(1)
+         except Exception:
+             pass
+
+         normalized_search = _normalize_text(raw_search).casefold()
+         best_candidate_idx = None
+         best_candidate_len = 0

          for i, line in enumerate(prompt_lines, 1):
-             normalized_line = line.strip()
+             normalized_line = _normalize_text(line).casefold()
+             line_len = len(normalized_line)
+
+             # Base similarity
              ratio = difflib.SequenceMatcher(None, normalized_search, normalized_line).ratio()

+             # Boost if one contains the other, but avoid trivial/short lines
+             if normalized_search and line_len >= 8:
+                 shorter = min(len(normalized_search), line_len)
+                 longer = max(len(normalized_search), line_len)
+                 length_ratio = shorter / longer if longer else 0.0
+                 if length_ratio >= 0.4 and (
+                     normalized_search in normalized_line or normalized_line in normalized_search
+                 ):
+                     ratio = max(ratio, 0.999)
+
              if verbose:
                  console.print(f"Line {i}: '{line}' - Match ratio: {ratio}")

-             # Increase threshold to 0.9 for more precise matching
-             if ratio > highest_ratio and ratio > 0.9:
-                 # Additional check for exact content match after normalization
-                 if normalized_search == normalized_line:
+             # Track best candidate overall, skipping empty lines
+             if line_len > 0:
+                 if ratio > highest_ratio:
                      highest_ratio = ratio
-                     best_match = i
-                     break # Exit on exact match
-                 highest_ratio = ratio
+                     best_candidate_idx = i
+                     best_candidate_len = line_len
+                 elif abs(ratio - highest_ratio) < 1e-6 and best_candidate_idx is not None:
+                     # Tie-breaker: prefer longer normalized line
+                     if line_len > best_candidate_len:
+                         best_candidate_idx = i
+                         best_candidate_len = line_len
+
+             # Early exit on exact normalized equality
+             if normalized_search == normalized_line:
                  best_match = i
+                 highest_ratio = 1.0
+                 break
+
+         # Decide on acceptance thresholds
+         primary_threshold = 0.8 # lowered threshold for normal acceptance
+         fallback_threshold = 0.6 # low-confidence fallback threshold
+
+         if best_match is None and best_candidate_idx is not None:
+             if highest_ratio >= primary_threshold:
+                 best_match = best_candidate_idx
+             elif highest_ratio >= fallback_threshold:
+                 best_match = best_candidate_idx
+                 if verbose:
+                     console.print(
+                         f"[yellow]Low-confidence match selected (ratio={highest_ratio:.3f}).[/yellow]"
+                     )
+
+         # Step 7b: Multi-line window matching (sizes 2 and 3) if no strong single-line match
+         if (best_match is None) or (highest_ratio < primary_threshold):
+             if verbose:
+                 console.print("[blue]No strong single-line match; trying multi-line windows...[/blue]")
+
+             win_best_ratio = 0.0
+             win_best_idx: Optional[int] = None
+             win_best_size = 0
+
+             for window_size in (2, 3):
+                 if len(prompt_lines) < window_size:
+                     continue
+                 for start_idx in range(1, len(prompt_lines) - window_size + 2):
+                     window_lines = prompt_lines[start_idx - 1 : start_idx - 1 + window_size]
+                     window_text = " ".join(window_lines)
+                     normalized_window = _normalize_text(window_text).casefold()
+                     seg_len = len(normalized_window)
+                     if seg_len == 0:
+                         continue
+
+                     ratio = difflib.SequenceMatcher(None, normalized_search, normalized_window).ratio()
+
+                     # Containment boost under similar length condition
+                     shorter = min(len(normalized_search), seg_len)
+                     longer = max(len(normalized_search), seg_len)
+                     length_ratio = (shorter / longer) if longer else 0.0
+                     if (
+                         normalized_search
+                         and seg_len >= 8
+                         and length_ratio >= 0.4
+                         and (
+                             normalized_search in normalized_window
+                             or normalized_window in normalized_search
+                         )
+                     ):
+                         ratio = max(ratio, 0.999)
+
+                     if verbose:
+                         console.print(
+                             f"Window {start_idx}-{start_idx+window_size-1}: ratio={ratio}"
+                         )
+
+                     # Track best window, prefer higher ratio; tie-breaker: larger window, then longer segment
+                     if ratio > win_best_ratio + 1e-6 or (
+                         abs(ratio - win_best_ratio) < 1e-6
+                         and (window_size > win_best_size or (window_size == win_best_size and seg_len > 0))
+                     ):
+                         win_best_ratio = ratio
+                         win_best_idx = start_idx
+                         win_best_size = window_size
+
+             if win_best_idx is not None and win_best_ratio > highest_ratio:
+                 if win_best_ratio >= primary_threshold:
+                     best_match = win_best_idx
+                     highest_ratio = win_best_ratio
+                 elif win_best_ratio >= fallback_threshold and best_match is None:
+                     best_match = win_best_idx
+                     highest_ratio = win_best_ratio
+                     if verbose:
+                         console.print(
+                             f"[yellow]Low-confidence multi-line match selected (ratio={win_best_ratio:.3f}).[/yellow]"
+                         )
+
+         # Step 7c: Deterministic fallback when LLM output cannot be matched reliably
+         fallback_used = False
+         if best_match is None:
+             best_match = _fallback_prompt_line(prompt_lines, code_str)
+             fallback_used = True

          # Step 8: Return results
          if verbose:
              console.print(f"[green]Found matching line: {best_match}[/green]")
              console.print(f"[green]Total cost: ${total_cost:.6f}[/green]")
              console.print(f"[green]Model used: {model_name}[/green]")
+             if fallback_used:
+                 console.print("[yellow]Fallback matching heuristic was used.[/yellow]")

          return best_match, total_cost, model_name

      except Exception as e:
          console.print(f"[bold red]Error in trace function: {str(e)}[/bold red]")
-         return None, 0.0, ""
+         try:
+             fallback_line = _fallback_prompt_line(prompt_file.splitlines(), code_file.splitlines()[code_line - 1] if 0 < code_line <= len(code_file.splitlines()) else "")
+         except Exception:
+             fallback_line = 1
+         return fallback_line, 0.0, "fallback"
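The trace changes above replace strict exact-line matching with normalized fuzzy matching: smart quotes, non-breaking spaces, whitespace, and case are normalized, candidates are scored with `difflib.SequenceMatcher`, near-substring matches get a containment boost, and the best line above a threshold wins, with a deterministic fallback if nothing clears the bar. The following standalone sketch shows the core idea only, with a simplified threshold and hypothetical sample lines; it is not the pdd implementation itself.

```python
# Standalone sketch of the normalized fuzzy matching used in trace().
# Threshold and sample data are illustrative, not taken from pdd.
import difflib
import re


def normalize(text: str) -> str:
    # Replace smart quotes and non-breaking spaces, collapse whitespace, lowercase.
    text = text.replace("\u201c", '"').replace("\u201d", '"')
    text = text.replace("\u2018", "'").replace("\u2019", "'")
    text = text.replace("\u00a0", " ")
    return re.sub(r"\s+", " ", text.strip()).casefold()


def best_prompt_line(prompt_lines: list[str], target: str, threshold: float = 0.8):
    needle = normalize(target)
    best_idx, best_ratio = None, 0.0
    for i, line in enumerate(prompt_lines, 1):  # 1-based line numbers
        candidate = normalize(line)
        if not candidate:
            continue
        ratio = difflib.SequenceMatcher(None, needle, candidate).ratio()
        # Containment boost: treat near-substring matches as near-exact.
        if len(candidate) >= 8 and (needle in candidate or candidate in needle):
            ratio = max(ratio, 0.999)
        if ratio > best_ratio:
            best_idx, best_ratio = i, ratio
    return (best_idx, best_ratio) if best_ratio >= threshold else (None, best_ratio)


lines = ["% Write a function that adds two numbers.", "% Return the sum as an int."]
print(best_prompt_line(lines, "Write a function that adds two numbers"))
# -> (1, 0.999) for this sample
```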
pdd/trace_main.py CHANGED
@@ -5,7 +5,7 @@ import os
  import logging
  from .construct_paths import construct_paths
  from .trace import trace
- from . import DEFAULT_TIME, DEFAULT_STRENGTH
+ from . import DEFAULT_TIME, DEFAULT_STRENGTH, DEFAULT_TEMPERATURE
  logging.basicConfig(level=logging.WARNING)
  logger = logging.getLogger(__name__)

@@ -39,7 +39,8 @@ def trace_main(ctx: click.Context, prompt_file: str, code_file: str, code_line:
          force=ctx.obj.get('force', False),
          quiet=quiet,
          command="trace",
-         command_options=command_options
+         command_options=command_options,
+         context_override=ctx.obj.get('context')
      )
      logger.debug("File paths constructed successfully")

@@ -50,7 +51,7 @@ def trace_main(ctx: click.Context, prompt_file: str, code_file: str, code_line:

      # Perform trace analysis
      strength = ctx.obj.get('strength', DEFAULT_STRENGTH)
-     temperature = ctx.obj.get('temperature', 0.0)
+     temperature = ctx.obj.get('temperature', DEFAULT_TEMPERATURE)
      time = ctx.obj.get('time', DEFAULT_TIME)
      try:
          prompt_line, total_cost, model_name = trace(
pdd/track_cost.py CHANGED
@@ -14,53 +14,88 @@ def track_cost(func):
              return func(*args, **kwargs)

          start_time = datetime.now()
-         try:
-             result = func(*args, **kwargs)
-         except Exception as e:
-             raise e
-         end_time = datetime.now()
+         result = None
+         exception_raised = None

          try:
-             if ctx.obj and hasattr(ctx.obj, 'get'):
-                 output_cost_path = ctx.obj.get('output_cost') or os.getenv('PDD_OUTPUT_COST_PATH')
-             else:
-                 output_cost_path = os.getenv('PDD_OUTPUT_COST_PATH')
-
-             if not output_cost_path:
-                 return result
-
-             command_name = ctx.command.name
-
-             cost, model_name = extract_cost_and_model(result)
-
-             input_files, output_files = collect_files(args, kwargs)
-
-             timestamp = start_time.strftime('%Y-%m-%dT%H:%M:%S.%f')[:-3]
-
-             row = {
-                 'timestamp': timestamp,
-                 'model': model_name,
-                 'command': command_name,
-                 'cost': cost,
-                 'input_files': ';'.join(input_files),
-                 'output_files': ';'.join(output_files),
-             }
-
-             file_exists = os.path.isfile(output_cost_path)
-             fieldnames = ['timestamp', 'model', 'command', 'cost', 'input_files', 'output_files']
-
-             with open(output_cost_path, 'a', newline='', encoding='utf-8') as csvfile:
-                 writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
-                 if not file_exists:
-                     writer.writeheader()
-                 writer.writerow(row)
-
-             print(f"Debug: Writing row to CSV: {row}")
-             print(f"Debug: Input files: {input_files}")
-             print(f"Debug: Output files: {output_files}")
+             # Record the invoked subcommand name on the shared ctx.obj so
+             # the CLI result callback can display proper names instead of
+             # falling back to "Unknown Command X".
+             try:
+                 # Avoid interfering with pytest-based CLI tests which expect
+                 # Click's default behavior (yielding "Unknown Command X").
+                 if not os.environ.get('PYTEST_CURRENT_TEST'):
+                     if ctx.obj is not None:
+                         invoked = ctx.obj.get('invoked_subcommands') or []
+                         # Use the current command name if available
+                         cmd_name = ctx.command.name if ctx.command else None
+                         if cmd_name:
+                             invoked.append(cmd_name)
+                         ctx.obj['invoked_subcommands'] = invoked
+             except Exception:
+                 # Non-fatal: if we cannot record, proceed normally
+                 pass

+             result = func(*args, **kwargs)
          except Exception as e:
-             rprint(f"[red]Error tracking cost: {e}[/red]")
+             exception_raised = e
+         finally:
+             end_time = datetime.now()
+
+             try:
+                 # Always collect files for core dump, even if output_cost is not set
+                 input_files, output_files = collect_files(args, kwargs)
+
+                 # Store collected files in context for core dump (even if output_cost not set)
+                 if ctx.obj is not None and ctx.obj.get('core_dump'):
+                     files_set = ctx.obj.get('core_dump_files', set())
+                     for f in input_files + output_files:
+                         if isinstance(f, str) and f:
+                             # Convert to absolute path for reliable access later
+                             abs_path = os.path.abspath(f)
+                             # Add the file if it exists OR if it looks like a file path
+                             # (it might have been created/deleted during command execution)
+                             if os.path.exists(abs_path) or '.' in os.path.basename(f):
+                                 files_set.add(abs_path)
+                     ctx.obj['core_dump_files'] = files_set
+
+                 # Check if we need to write cost tracking (only on success)
+                 if exception_raised is None:
+                     if ctx.obj and hasattr(ctx.obj, 'get'):
+                         output_cost_path = ctx.obj.get('output_cost') or os.getenv('PDD_OUTPUT_COST_PATH')
+                     else:
+                         output_cost_path = os.getenv('PDD_OUTPUT_COST_PATH')
+
+                     if output_cost_path:
+                         command_name = ctx.command.name
+                         cost, model_name = extract_cost_and_model(result)
+
+                         timestamp = start_time.strftime('%Y-%m-%dT%H:%M:%S.%f')[:-3]
+
+                         row = {
+                             'timestamp': timestamp,
+                             'model': model_name,
+                             'command': command_name,
+                             'cost': cost,
+                             'input_files': ';'.join(input_files),
+                             'output_files': ';'.join(output_files),
+                         }
+
+                         file_exists = os.path.isfile(output_cost_path)
+                         fieldnames = ['timestamp', 'model', 'command', 'cost', 'input_files', 'output_files']
+
+                         with open(output_cost_path, 'a', newline='', encoding='utf-8') as csvfile:
+                             writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
+                             if not file_exists:
+                                 writer.writeheader()
+                             writer.writerow(row)
+
+             except Exception as e:
+                 rprint(f"[red]Error tracking cost: {e}[/red]")
+
+             # Re-raise the exception if one occurred
+             if exception_raised is not None:
+                 raise exception_raised

          return result

@@ -75,28 +110,70 @@ def collect_files(args, kwargs):
      input_files = []
      output_files = []

-     # Collect from args
-     for arg in args:
-         if isinstance(arg, str):
-             input_files.append(arg)
-         elif isinstance(arg, list):
-             input_files.extend([f for f in arg if isinstance(f, str)])
-
-     # Collect from kwargs
+     # Known input parameter names that typically contain file paths
+     input_param_names = {
+         'prompt_file', 'prompt', 'input', 'input_file', 'source', 'source_file',
+         'file', 'path', 'original_prompt_file_path', 'files', 'core_file',
+         'code_file', 'unit_test_file', 'error_file', 'test_file', 'example_file'
+     }
+
+     # Known output parameter names (anything with 'output' in the name)
+     output_param_names = {
+         'output', 'output_file', 'output_path', 'destination', 'dest', 'target',
+         'output_test', 'output_code', 'output_results'
+     }
+
+     # Helper to check if something looks like a file path
+     def looks_like_file(path_str):
+         """Check if string looks like a file path."""
+         if not path_str or not isinstance(path_str, str):
+             return False
+         # Has file extension or exists
+         return '.' in os.path.basename(path_str) or os.path.isfile(path_str)
+
+     # Collect from kwargs (most reliable since Click uses named parameters)
      for k, v in kwargs.items():
-         if k == 'output_cost':
+         if k in ('ctx', 'context', 'output_cost'):
              continue
-         if isinstance(v, str):
-             if k.startswith('output'):
-                 output_files.append(v)
-             else:
-                 input_files.append(v)
+
+         # Check if this is a known parameter name
+         is_input_param = k in input_param_names or 'file' in k.lower() or 'prompt' in k.lower()
+         is_output_param = k in output_param_names or 'output' in k.lower()
+
+         if isinstance(v, str) and v:
+             # For known parameter names, trust that they represent file paths
+             # For unknown parameters, check if it looks like a file
+             if is_input_param or is_output_param or looks_like_file(v):
+                 if is_output_param:
+                     output_files.append(v)
+                 elif is_input_param:
+                     input_files.append(v)
+                 else:
+                     # Unknown parameter but looks like a file, treat as input
+                     input_files.append(v)
          elif isinstance(v, list):
-             if k.startswith('output'):
-                 output_files.extend([f for f in v if isinstance(f, str)])
-             else:
-                 input_files.extend([f for f in v if isinstance(f, str)])
+             for item in v:
+                 if isinstance(item, str) and item:
+                     # Same logic for list items
+                     if is_input_param or is_output_param or looks_like_file(item):
+                         if is_output_param:
+                             output_files.append(item)
+                         elif is_input_param:
+                             input_files.append(item)
+                         else:
+                             input_files.append(item)
+
+     # Collect from positional args (skip first arg which is usually Click context)
+     for i, arg in enumerate(args):
+         # Skip first argument if it looks like a Click context
+         if i == 0 and hasattr(arg, 'obj'):
+             continue
+
+         if isinstance(arg, str) and arg and looks_like_file(arg):
+             input_files.append(arg)
+         elif isinstance(arg, list):
+             for item in arg:
+                 if isinstance(item, str) and item and looks_like_file(item):
+                     input_files.append(item)

-     print(f"Debug: Collected input files: {input_files}")
-     print(f"Debug: Collected output files: {output_files}")
      return input_files, output_files
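The rewritten `collect_files` classifies Click parameters by name rather than by position: output-like names go to `output_files`, input-like names (or values that merely look like file paths) go to `input_files`, and non-file options are skipped. A compact, self-contained sketch of that heuristic follows, using hypothetical parameter names and values; it mirrors the idea, not the exact pdd code.

```python
# Compact sketch of the name-based file classification shown above.
# Parameter names and sample values are hypothetical.
import os


def classify_files(kwargs: dict) -> tuple[list[str], list[str]]:
    inputs, outputs = [], []
    for name, value in kwargs.items():
        if name in ("ctx", "context", "output_cost") or not isinstance(value, str) or not value:
            continue
        # "Looks like a file": has an extension or actually exists on disk.
        looks_like_file = "." in os.path.basename(value) or os.path.isfile(value)
        if "output" in name.lower():
            outputs.append(value)
        elif "file" in name.lower() or "prompt" in name.lower() or looks_like_file:
            inputs.append(value)
    return inputs, outputs


print(classify_files({
    "prompt_file": "prompts/orders_python.prompt",
    "output": "src/orders.py",
    "strength": "high",  # not a file-like value: ignored
}))
# -> (['prompts/orders_python.prompt'], ['src/orders.py'])
```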