PyPI - amd-gaia - Versions diffs - 0.14.3__py3-none-any.whl → 0.15.1__py3-none-any.whl - Mend

amd-gaia 0.14.3py3-none-any.whl → 0.15.1py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181) hide show

{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/METADATA +223 -223
amd_gaia-0.15.1.dist-info/RECORD +178 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/entry_points.txt +1 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/licenses/LICENSE.md +20 -20
gaia/__init__.py +29 -29
gaia/agents/__init__.py +19 -19
gaia/agents/base/__init__.py +9 -9
gaia/agents/base/agent.py +2177 -2177
gaia/agents/base/api_agent.py +120 -120
gaia/agents/base/console.py +1841 -1841
gaia/agents/base/errors.py +237 -237
gaia/agents/base/mcp_agent.py +86 -86
gaia/agents/base/tools.py +83 -83
gaia/agents/blender/agent.py +556 -556
gaia/agents/blender/agent_simple.py +133 -135
gaia/agents/blender/app.py +211 -211
gaia/agents/blender/app_simple.py +41 -41
gaia/agents/blender/core/__init__.py +16 -16
gaia/agents/blender/core/materials.py +506 -506
gaia/agents/blender/core/objects.py +316 -316
gaia/agents/blender/core/rendering.py +225 -225
gaia/agents/blender/core/scene.py +220 -220
gaia/agents/blender/core/view.py +146 -146
gaia/agents/chat/__init__.py +9 -9
gaia/agents/chat/agent.py +835 -835
gaia/agents/chat/app.py +1058 -1058
gaia/agents/chat/session.py +508 -508
gaia/agents/chat/tools/__init__.py +15 -15
gaia/agents/chat/tools/file_tools.py +96 -96
gaia/agents/chat/tools/rag_tools.py +1729 -1729
gaia/agents/chat/tools/shell_tools.py +436 -436
gaia/agents/code/__init__.py +7 -7
gaia/agents/code/agent.py +549 -549
gaia/agents/code/cli.py +377 -0
gaia/agents/code/models.py +135 -135
gaia/agents/code/orchestration/__init__.py +24 -24
gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
gaia/agents/code/orchestration/checklist_generator.py +713 -713
gaia/agents/code/orchestration/factories/__init__.py +9 -9
gaia/agents/code/orchestration/factories/base.py +63 -63
gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
gaia/agents/code/orchestration/factories/python_factory.py +106 -106
gaia/agents/code/orchestration/orchestrator.py +841 -841
gaia/agents/code/orchestration/project_analyzer.py +391 -391
gaia/agents/code/orchestration/steps/__init__.py +67 -67
gaia/agents/code/orchestration/steps/base.py +188 -188
gaia/agents/code/orchestration/steps/error_handler.py +314 -314
gaia/agents/code/orchestration/steps/nextjs.py +828 -828
gaia/agents/code/orchestration/steps/python.py +307 -307
gaia/agents/code/orchestration/template_catalog.py +469 -469
gaia/agents/code/orchestration/workflows/__init__.py +14 -14
gaia/agents/code/orchestration/workflows/base.py +80 -80
gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
gaia/agents/code/orchestration/workflows/python.py +94 -94
gaia/agents/code/prompts/__init__.py +11 -11
gaia/agents/code/prompts/base_prompt.py +77 -77
gaia/agents/code/prompts/code_patterns.py +2036 -2036
gaia/agents/code/prompts/nextjs_prompt.py +40 -40
gaia/agents/code/prompts/python_prompt.py +109 -109
gaia/agents/code/schema_inference.py +365 -365
gaia/agents/code/system_prompt.py +41 -41
gaia/agents/code/tools/__init__.py +42 -42
gaia/agents/code/tools/cli_tools.py +1138 -1138
gaia/agents/code/tools/code_formatting.py +319 -319
gaia/agents/code/tools/code_tools.py +769 -769
gaia/agents/code/tools/error_fixing.py +1347 -1347
gaia/agents/code/tools/external_tools.py +180 -180
gaia/agents/code/tools/file_io.py +845 -845
gaia/agents/code/tools/prisma_tools.py +190 -190
gaia/agents/code/tools/project_management.py +1016 -1016
gaia/agents/code/tools/testing.py +321 -321
gaia/agents/code/tools/typescript_tools.py +122 -122
gaia/agents/code/tools/validation_parsing.py +461 -461
gaia/agents/code/tools/validation_tools.py +806 -806
gaia/agents/code/tools/web_dev_tools.py +1758 -1758
gaia/agents/code/validators/__init__.py +16 -16
gaia/agents/code/validators/antipattern_checker.py +241 -241
gaia/agents/code/validators/ast_analyzer.py +197 -197
gaia/agents/code/validators/requirements_validator.py +145 -145
gaia/agents/code/validators/syntax_validator.py +171 -171
gaia/agents/docker/__init__.py +7 -7
gaia/agents/docker/agent.py +642 -642
gaia/agents/emr/__init__.py +8 -8
gaia/agents/emr/agent.py +1506 -1506
gaia/agents/emr/cli.py +1322 -1322
gaia/agents/emr/constants.py +475 -475
gaia/agents/emr/dashboard/__init__.py +4 -4
gaia/agents/emr/dashboard/server.py +1974 -1974
gaia/agents/jira/__init__.py +11 -11
gaia/agents/jira/agent.py +894 -894
gaia/agents/jira/jql_templates.py +299 -299
gaia/agents/routing/__init__.py +7 -7
gaia/agents/routing/agent.py +567 -570
gaia/agents/routing/system_prompt.py +75 -75
gaia/agents/summarize/__init__.py +11 -0
gaia/agents/summarize/agent.py +885 -0
gaia/agents/summarize/prompts.py +129 -0
gaia/api/__init__.py +23 -23
gaia/api/agent_registry.py +238 -238
gaia/api/app.py +305 -305
gaia/api/openai_server.py +575 -575
gaia/api/schemas.py +186 -186
gaia/api/sse_handler.py +373 -373
gaia/apps/__init__.py +4 -4
gaia/apps/llm/__init__.py +6 -6
gaia/apps/llm/app.py +173 -169
gaia/apps/summarize/app.py +116 -633
gaia/apps/summarize/html_viewer.py +133 -133
gaia/apps/summarize/pdf_formatter.py +284 -284
gaia/audio/__init__.py +2 -2
gaia/audio/audio_client.py +439 -439
gaia/audio/audio_recorder.py +269 -269
gaia/audio/kokoro_tts.py +599 -599
gaia/audio/whisper_asr.py +432 -432
gaia/chat/__init__.py +16 -16
gaia/chat/app.py +430 -430
gaia/chat/prompts.py +522 -522
gaia/chat/sdk.py +1228 -1225
gaia/cli.py +5481 -5621
gaia/database/__init__.py +10 -10
gaia/database/agent.py +176 -176
gaia/database/mixin.py +290 -290
gaia/database/testing.py +64 -64
gaia/eval/batch_experiment.py +2332 -2332
gaia/eval/claude.py +542 -542
gaia/eval/config.py +37 -37
gaia/eval/email_generator.py +512 -512
gaia/eval/eval.py +3179 -3179
gaia/eval/groundtruth.py +1130 -1130
gaia/eval/transcript_generator.py +582 -582
gaia/eval/webapp/README.md +167 -167
gaia/eval/webapp/package-lock.json +875 -875
gaia/eval/webapp/package.json +20 -20
gaia/eval/webapp/public/app.js +3402 -3402
gaia/eval/webapp/public/index.html +87 -87
gaia/eval/webapp/public/styles.css +3661 -3661
gaia/eval/webapp/server.js +415 -415
gaia/eval/webapp/test-setup.js +72 -72
gaia/llm/__init__.py +9 -2
gaia/llm/base_client.py +60 -0
gaia/llm/exceptions.py +12 -0
gaia/llm/factory.py +70 -0
gaia/llm/lemonade_client.py +3236 -3221
gaia/llm/lemonade_manager.py +294 -294
gaia/llm/providers/__init__.py +9 -0
gaia/llm/providers/claude.py +108 -0
gaia/llm/providers/lemonade.py +120 -0
gaia/llm/providers/openai_provider.py +79 -0
gaia/llm/vlm_client.py +382 -382
gaia/logger.py +189 -189
gaia/mcp/agent_mcp_server.py +245 -245
gaia/mcp/blender_mcp_client.py +138 -138
gaia/mcp/blender_mcp_server.py +648 -648
gaia/mcp/context7_cache.py +332 -332
gaia/mcp/external_services.py +518 -518
gaia/mcp/mcp_bridge.py +811 -550
gaia/mcp/servers/__init__.py +6 -6
gaia/mcp/servers/docker_mcp.py +83 -83
gaia/perf_analysis.py +361 -0
gaia/rag/__init__.py +10 -10
gaia/rag/app.py +293 -293
gaia/rag/demo.py +304 -304
gaia/rag/pdf_utils.py +235 -235
gaia/rag/sdk.py +2194 -2194
gaia/security.py +163 -163
gaia/talk/app.py +289 -289
gaia/talk/sdk.py +538 -538
gaia/testing/__init__.py +87 -87
gaia/testing/assertions.py +330 -330
gaia/testing/fixtures.py +333 -333
gaia/testing/mocks.py +493 -493
gaia/util.py +46 -46
gaia/utils/__init__.py +33 -33
gaia/utils/file_watcher.py +675 -675
gaia/utils/parsing.py +223 -223
gaia/version.py +100 -100
amd_gaia-0.14.3.dist-info/RECORD +0 -168
gaia/agents/code/app.py +0 -266
gaia/llm/llm_client.py +0 -729
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/WHEEL +0 -0
{amd_gaia-0.14.3.dist-info → amd_gaia-0.15.1.dist-info}/top_level.txt +0 -0

gaia/agents/code/orchestration/checklist_generator.py CHANGED Viewed

@@ -1,713 +1,713 @@
-# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
-# SPDX-License-Identifier: MIT
-"""Checklist Generator for LLM-Driven Code Generation.
-This module uses an LLM to generate a checklist of template invocations
-based on the user's request and the available template catalog.
-The generator:
-1. Receives user request and project context
-2. Sends prompt to LLM with template catalog
-3. Parses LLM response into structured checklist
-4. Validates checklist items against template definitions
-The resulting checklist is then executed deterministically by
-ChecklistExecutor.
-"""
-import json
-import logging
-import re
-from dataclasses import dataclass, field
-from typing import Any, Dict, List, Optional, Protocol
-from .steps.base import UserContext
-from .template_catalog import get_catalog_prompt, validate_checklist_item
-logger = logging.getLogger(__name__)
-class ChatSDK(Protocol):
-    """Protocol for chat SDK interface."""
-    def send(self, message: str, timeout: int = 600, no_history: bool = False) -> Any:
-        """Send a message and get response."""
-        ...
-@dataclass
-class ChecklistItem:
-    """Single item in the generated checklist.
-    Represents a template invocation with its parameters and
-    the LLM's reasoning for including it.
-    """
-    template: str
-    params: Dict[str, Any]
-    description: str
-    def to_dict(self) -> Dict[str, Any]:
-        """Convert to dictionary representation."""
-        return {
-            "template": self.template,
-            "params": self.params,
-            "description": self.description,
-        }
-@dataclass
-class GeneratedChecklist:
-    """Complete checklist generated by LLM.
-    Contains the list of template invocations and the LLM's
-    overall reasoning for the chosen approach.
-    """
-    items: List[ChecklistItem]
-    reasoning: str
-    raw_response: str = ""
-    validation_errors: List[str] = field(default_factory=list)
-    @property
-    def is_valid(self) -> bool:
-        """Check if checklist passed validation."""
-        return len(self.validation_errors) == 0
-    def to_dict(self) -> Dict[str, Any]:
-        """Convert to dictionary representation."""
-        return {
-            "reasoning": self.reasoning,
-            "checklist": [item.to_dict() for item in self.items],
-            "is_valid": self.is_valid,
-            "validation_errors": self.validation_errors,
-        }
-@dataclass
-class ProjectState:
-    """Current state of the project for context."""
-    exists: bool = False
-    has_package_json: bool = False
-    has_prisma: bool = False
-    has_next_config: bool = False
-    existing_models: List[str] = field(default_factory=list)
-    existing_routes: List[str] = field(default_factory=list)
-    existing_pages: List[str] = field(default_factory=list)
-    def to_prompt(self) -> str:
-        """Generate prompt-friendly description of project state."""
-        if not self.exists:
-            return "Project does not exist yet - will be created fresh."
-        lines = ["Current project state:"]
-        if self.has_package_json:
-            lines.append("- ✓ package.json exists (Node.js project)")
-        if self.has_next_config:
-            lines.append("- ✓ next.config.ts exists (Next.js configured)")
-        if self.has_prisma:
-            lines.append("- ✓ Prisma configured")
-            if self.existing_models:
-                lines.append(f"  - Models: {', '.join(self.existing_models)}")
-        if self.existing_routes:
-            lines.append(f"- Existing API routes: {', '.join(self.existing_routes)}")
-        if self.existing_pages:
-            lines.append(f"- Existing pages: {', '.join(self.existing_pages)}")
-        return "\n".join(lines)
-CHECKLIST_SYSTEM_PROMPT = """You are a code generation planner. Your task is to analyze the user's request and generate a checklist of template invocations that will create the requested application.
-{catalog_prompt}
-## Instructions
-1. Analyze the user's request carefully
-2. Consider what the user ACTUALLY wants (semantic understanding)
-3. Select templates that will fulfill the request
-4. Add semantic enhancements based on the request type:
-   - For "todo" apps: add checkboxes for completion status
-   - For "blog" apps: add date fields for posts
-   - For "e-commerce": add price, inventory fields
-5. Ensure dependencies are satisfied (run setup before data, data before API, API before UI)
-6. Generate a complete checklist that creates a working application
-7. When follow-up fixes are requested, use `fix_code` to repair the specific files called out by validation/test logs. Extract the precise file paths and line numbers from the errors (see the Raw Validation Logs) and pass those line numbers inside the error description so the fixer knows exactly where to focus. Always reference the latest findings to decide which fixes to schedule before running validations again.
-8. If the user explicitly requests an additional UI artifact (countdown display, stats badge, etc.), schedule a `generate_react_component` step with the appropriate `artifact-*` variant (e.g., `"artifact-timer"`) and a descriptive `component_name`. Keep the artifact's logic inside that client component—server components like `page.tsx` should only render the artifact and pass any required props.
-9. **Route pairing requirement:** Whenever you schedule `{{"template": "generate_api_route", "params": {{"type": "collection", ...}}}}`, you MUST also include a matching `generate_api_route` item with `"type": "item"` for the same resource so detail pages can call `/api/<resource>/[id]`.
-This workflow repeats until all validations pass, so each checklist should either advance new functionality or explicitly repair the failures reported in the latest validation logs.
-## IMPORTANT: Complete CRUD Applications
-For any app that manages resources (todos, posts, users, etc.), you MUST generate ALL of these UI components:
-1. **Form component** (variant: "form") - Reusable form for create (generate this first so other pages can import it)
-2. **Artifact components** (variant: "artifact-*") - Any additional UI artifacts requested by the user (e.g., countdown display, stats badge). Generate these before any page that consumes them.
-3. **New page** (variant: "new") - Create new item at /resources/new
-4. **Edit page** (variant: "detail") - Edit single item at /resources/[id] with pre-populated form
-5. **List page** (variant: "list") - Main page showing all items at /resources
-Missing any of the required components (form, new, detail, list) will result in broken navigation! When artifacts are requested, they must also be generated or the UI will be incomplete.
-## REQUIRED: Setup and Validation Commands
-**CRITICAL**: The following commands are REQUIRED for a valid plan:
-1. **setup_app_styling** MUST be included after creating the application (after `create_next_app`). This configures app-wide styling with modern dark theme design system.
-2. **setup_testing** MUST be included after `setup_app_styling`. This sets up the testing infrastructure.
-3. **generate_style_tests** MUST be included after `setup_testing`. This generates CSS integrity tests that validate the design system.
-4. **The final 2 commands MUST be in this exact order:**
-   - Second-to-last: `run_typescript_check` (validates TypeScript compilation)
-   - Last: `validate_styles` (validates CSS files and design system)
-These setup and validation commands are mandatory - a plan without them is INVALID.
-## Output Format
-Respond with ONLY a JSON object (no markdown code blocks):
-{{
-  "reasoning": "Brief explanation of your approach and any semantic enhancements",
-  "checklist": [
-    {{"template": "template_name", "params": {{}}, "description": "Why this step is needed"}}
-  ]
-}}
-Important:
-- Use exact template names from the catalog
-- Provide all required parameters
-- Order items by dependency (setup first, then data, then API, then UI)
-- REQUIRED ordering for `generate_react_component`: emit all non-`list` variants (form, new, detail, actions, artifact-*) before the `variant: "list"` call so the list can import previously generated components
-- Add semantic enhancements that make the app intuitive (e.g., checkboxes for todos)
-- For CRUD apps, ALWAYS include all 4 UI variants: list, form, new, detail
-- REQUIRED: Include `setup_app_styling` after `create_next_app`
-- REQUIRED: Include `setup_testing` after `setup_app_styling`
-- REQUIRED: Include `generate_style_tests` after `setup_testing`
-- REQUIRED: End with `run_typescript_check`, then `validate_styles` as the last 2 commands
-- When converting a raw validation error into `fix_code`, copy the exact snippet (file, line, column, and message). For example:
-  Raw Validation Logs (example):
-  ```
-  {{"template": "run_typescript_check", "output": {{"errors": "path/to/File.tsx(10,5): error TS1234: <error text>\\n"}}}}
-  ```
-  Corresponding checklist item:
-  ```
-  {{
-    "template": "fix_code",
-    "params": {{
-      "file_path": "path/to/File.tsx",
-      "error_description": "path/to/File.tsx(10,5): error TS1234: <error text>"
-    }},
-    "description": "Fix the TypeScript compiler error reported for File.tsx."
-  }}
-  ```
-  Always keep the error text verbatim so the fixer knows exactly where to edit."""
-class ChecklistGenerator:
-    """Generate execution checklist using LLM.
-    The generator sends the user request, project state, and template
-    catalog to an LLM, which returns a structured checklist of template
-    invocations.
-    """
-    def __init__(self, chat_sdk: ChatSDK):
-        """Initialize the checklist generator.
-        Args:
-            chat_sdk: Chat SDK instance for LLM communication
-        """
-        self.chat = chat_sdk
-    def generate_initial_checklist(
-        self,
-        context: UserContext,
-        project_state: Optional[ProjectState] = None,
-    ) -> GeneratedChecklist:
-        """Generate the initial project-scaffolding checklist."""
-        if project_state is None:
-            project_state = ProjectState()
-        system_prompt = CHECKLIST_SYSTEM_PROMPT.format(
-            catalog_prompt=get_catalog_prompt()
-        )
-        user_prompt = self._build_initial_prompt(context, project_state)
-        full_prompt = f"{system_prompt}\n\n## User Request\n\n{user_prompt}"
-        return self._generate_from_prompt(full_prompt)
-    def generate_debug_checklist(
-        self,
-        context: UserContext,
-        project_state: Optional[ProjectState],
-        prior_errors: Optional[List[str]],
-        validation_logs: Optional[List[Any]],
-    ) -> GeneratedChecklist:
-        """Generate a remediation checklist to fix outstanding errors."""
-        if project_state is None:
-            project_state = ProjectState()
-        debug_prompt = self._build_debug_prompt(
-            context=context,
-            project_state=project_state,
-            prior_errors=prior_errors or [],
-            validation_logs=validation_logs or [],
-        )
-        system_prompt = CHECKLIST_SYSTEM_PROMPT.format(
-            catalog_prompt=get_catalog_prompt()
-        )
-        full_prompt = f"{system_prompt}\n\n## Remediation Context\n\n{debug_prompt}"
-        return self._generate_from_prompt(full_prompt)
-    def _generate_from_prompt(self, full_prompt: str) -> GeneratedChecklist:
-        """Common checklist generation logic with retries."""
-        logger.debug("Generating checklist with LLM...")
-        logger.debug(f"Checklist prompt: {full_prompt}")
-        max_attempts = 3
-        last_failure_reason = "unknown error"
-        for attempt in range(1, max_attempts + 1):
-            try:
-                response = self.chat.send(full_prompt, timeout=1200)
-                response_text = self._extract_response_text(response)
-                logger.debug(f"LLM response (attempt {attempt}): {response_text}")
-                checklist = self._parse_checklist(response_text)
-            except Exception as exc:  # pylint: disable=broad-exception-caught
-                last_failure_reason = str(exc)
-                logger.warning(
-                    "Checklist generation attempt %d/%d failed: %s",
-                    attempt,
-                    max_attempts,
-                    exc,
-                )
-                continue
-            if not checklist.items:
-                last_failure_reason = "LLM returned an empty checklist"
-                logger.warning(
-                    "Checklist generation attempt %d/%d returned no items, retrying...",
-                    attempt,
-                    max_attempts,
-                )
-                continue
-            self._validate_checklist(checklist)
-            if checklist.validation_errors:
-                last_failure_reason = "; ".join(checklist.validation_errors)
-                logger.warning(
-                    "Checklist generation attempt %d/%d failed validation: %s",
-                    attempt,
-                    max_attempts,
-                    checklist.validation_errors,
-                )
-                continue
-            logger.debug(
-                "Generated checklist with %d items on attempt %d",
-                len(checklist.items),
-                attempt,
-            )
-            return checklist
-        raise RuntimeError(
-            f"Failed to generate a valid checklist after {max_attempts} attempts: "
-            f"{last_failure_reason}"
-        )
-    def _build_initial_prompt(
-        self,
-        context: UserContext,
-        project_state: ProjectState,
-    ) -> str:
-        """Build the user prompt with all context.
-        Args:
-            context: User context
-            project_state: Current project state
-        Returns:
-            Formatted user prompt string
-        """
-        lines = [f"**User Request**: {context.user_request}"]
-        if context.entity_name:
-            lines.append(f"\n**Inferred Entity**: {context.entity_name}")
-        if context.schema_fields:
-            lines.append(f"\n**Inferred Fields**: {json.dumps(context.schema_fields)}")
-        lines.append(f"\n**Project Directory**: {context.project_dir}")
-        lines.append(f"\n**Language**: {context.language}")
-        lines.append(f"\n**Project Type**: {context.project_type}")
-        lines.append(f"\n{project_state.to_prompt()}")
-        if context.fix_feedback:
-            lines.append("\n**Outstanding Fix Requests**:")
-            for note in context.fix_feedback[-5:]:
-                lines.append(f"- {note}")
-        if context.validation_reports:
-            lines.append("\n**Recent Validation/Test Findings**:")
-            for log in context.validation_reports[-5:]:
-                status = "PASS" if log.get("success", True) else "FAIL"
-                template = log.get("template", "validation_step")
-                description = log.get("description", "")
-                lines.append(f"- [{status}] {template}: {description}")
-                if log.get("error"):
-                    lines.append(f"  Error: {log['error']}")
-                output = log.get("output", {})
-                snippet = ""
-                if isinstance(output, dict):
-                    for key in ("stdout", "stderr", "message", "details"):
-                        if output.get(key):
-                            snippet = str(output[key])[:200]
-                            break
-                    if not snippet and output:
-                        snippet = json.dumps(output)[:200]
-                elif output:
-                    snippet = str(output)[:200]
-                if snippet:
-                    lines.append(f"  Output: {snippet}")
-        lines.append("\nGenerate a checklist to fulfill this request.")
-        return "\n".join(lines)
-    def _build_debug_prompt(
-        self,
-        context: UserContext,
-        project_state: ProjectState,
-        prior_errors: List[str],
-        validation_logs: List[Any],
-    ) -> str:
-        """Build prompt for remediation/debug checklists."""
-        lines = [
-            "You are a remediation planner for the GAIA web development agent. "
-            "The project has already been scaffolded; focus exclusively on fixing outstanding issues."
-        ]
-        lines.append(f"\n**User Request**: {context.user_request}")
-        lines.append(f"\n**Project Directory**: {context.project_dir}")
-        if context.entity_name:
-            lines.append(f"\n**Entity**: {context.entity_name}")
-        if context.schema_fields:
-            lines.append(f"\n**Schema Fields**: {json.dumps(context.schema_fields)}")
-        lines.append(f"\n{project_state.to_prompt()}")
-        if prior_errors:
-            lines.append("\n**Execution Errors From Last Attempt:**")
-            for err in prior_errors:
-                lines.append(f"- {err}")
-        if validation_logs:
-            lines.append("\n**Recent Validation/Test Results:**")
-            raw_entries = []
-            for log in validation_logs[-10:]:
-                entry = log.to_dict() if hasattr(log, "to_dict") else log
-                template = entry.get("template", "unknown_step")
-                success = entry.get("success", True)
-                desc = entry.get("description", "")
-                status = "PASS" if success else "FAIL"
-                lines.append(f"- [{status}] {template}: {desc}")
-                if entry.get("error"):
-                    lines.append(f"  Error: {entry['error']}")
-                output = entry.get("output") or {}
-                for key in ("stdout", "stderr", "details", "message"):
-                    if output.get(key):
-                        snippet = str(output[key])[:200]
-                        lines.append(f"  Output: {snippet}")
-                        break
-                raw_entries.append(entry)
-            if raw_entries:
-                lines.append(
-                    "\n**Raw Validation Logs (exact text for follow-up fixes):**"
-                )
-                for entry in raw_entries:
-                    lines.append(json.dumps(entry, ensure_ascii=False))
-        if context.fix_feedback:
-            lines.append("\n**Outstanding Fix Instructions:**")
-            for note in context.fix_feedback[-10:]:
-                lines.append(f"- {note}")
-        lines.append(
-            "\nYour job: draft a concise checklist that repairs the errors above, "
-            "regenerates any broken code, and re-runs critical validations."
-        )
-        lines.append(
-            "\n**Critical Requirements for Debug Checklists:**\n"
-            "1. Use `fix_code` to repair the specific files referenced in the failures above.\n"
-            "2. Re-run any validations or tests that previously failed once fixes are applied.\n"
-            "3. Always include `run_typescript_check` as the second-to-last command to capture current compiler errors.\n"
-            "4. Always include `validate_styles` as the final command to capture CSS/design regressions."
-        )
-        return "\n".join(lines)
-    def _extract_response_text(self, response: Any) -> str:
-        """Extract text from LLM response.
-        Handles different response formats from various SDKs.
-        Args:
-            response: Response from chat SDK
-        Returns:
-            Response text string
-        """
-        if isinstance(response, str):
-            return response
-        # Handle response objects with text attribute
-        if hasattr(response, "text"):
-            return response.text
-        # Handle response objects with content attribute
-        if hasattr(response, "content"):
-            return response.content
-        # Handle dict-like responses
-        if isinstance(response, dict):
-            return response.get("text", response.get("content", str(response)))
-        return str(response)
-    def _parse_checklist(self, response_text: str) -> GeneratedChecklist:
-        """Parse LLM response into GeneratedChecklist.
-        Args:
-            response_text: Raw LLM response text
-        Returns:
-            Parsed GeneratedChecklist
-        """
-        try:
-            # Try to extract JSON from the response
-            json_str = self._extract_json(response_text)
-            data = json.loads(json_str)
-            # Parse items
-            items = []
-            for item_data in data.get("checklist", []):
-                item = ChecklistItem(
-                    template=item_data.get("template", ""),
-                    params=item_data.get("params", {}),
-                    description=item_data.get("description", ""),
-                )
-                items.append(item)
-            return GeneratedChecklist(
-                items=items,
-                reasoning=data.get("reasoning", ""),
-                raw_response=response_text,
-            )
-        except json.JSONDecodeError as e:
-            logger.error(f"Failed to parse checklist JSON: {e}")
-            return GeneratedChecklist(
-                items=[],
-                reasoning="",
-                raw_response=response_text,
-                validation_errors=[f"Failed to parse JSON: {str(e)}"],
-            )
-    def _extract_json(self, text: str) -> str:
-        """Extract JSON from text that might contain markdown or other content.
-        Args:
-            text: Text that may contain JSON
-        Returns:
-            Extracted JSON string
-        """
-        # Try to find JSON in markdown code block
-        code_block_match = re.search(r"```(?:json)?\s*\n?(.*?)\n?```", text, re.DOTALL)
-        if code_block_match:
-            return code_block_match.group(1).strip()
-        # Try to find raw JSON object
-        json_match = re.search(r"\{.*\}", text, re.DOTALL)
-        if json_match:
-            return json_match.group(0)
-        # Return as-is and let JSON parser handle it
-        return text.strip()
-    def _validate_checklist(self, checklist: GeneratedChecklist) -> None:
-        """Validate checklist items against template definitions.
-        Adds validation errors to the checklist if any are found.
-        Args:
-            checklist: Checklist to validate (modified in place)
-        """
-        for item in checklist.items:
-            errors = validate_checklist_item(item.template, item.params)
-            checklist.validation_errors.extend(errors)
-        # Check for duplicate templates (some are ok, like multiple API routes)
-        seen_templates = {}
-        for item in checklist.items:
-            key = f"{item.template}:{json.dumps(item.params, sort_keys=True)}"
-            if key in seen_templates:
-                checklist.validation_errors.append(
-                    f"Duplicate checklist item: {item.template} with same params"
-                )
-            seen_templates[key] = True
-        # Validate required setup: setup_app_styling must come after create_next_app
-        create_app_index = None
-        setup_styling_index = None
-        setup_testing_index = None
-        for i, item in enumerate(checklist.items):
-            if item.template == "create_next_app":
-                create_app_index = i
-            if item.template == "setup_app_styling":
-                setup_styling_index = i
-            if item.template == "setup_testing":
-                setup_testing_index = i
-        if create_app_index is not None:
-            if setup_styling_index is None:
-                checklist.validation_errors.append(
-                    "REQUIRED: 'setup_app_styling' must be included after 'create_next_app'"
-                )
-            elif setup_styling_index <= create_app_index:
-                checklist.validation_errors.append(
-                    "REQUIRED: 'setup_app_styling' must come after 'create_next_app' in the checklist"
-                )
-        # Validate required testing setup: setup_testing must come after setup_app_styling
-        if setup_styling_index is not None:
-            if setup_testing_index is None:
-                checklist.validation_errors.append(
-                    "REQUIRED: 'setup_testing' must be included after 'setup_app_styling'"
-                )
-            elif setup_testing_index <= setup_styling_index:
-                checklist.validation_errors.append(
-                    "REQUIRED: 'setup_testing' must come after 'setup_app_styling' in the checklist"
-                )
-        # Validate required final validation commands: run_typescript_check, validate_styles
-        if len(checklist.items) < 2:
-            checklist.validation_errors.append(
-                "REQUIRED: Checklist must end with 'run_typescript_check', "
-                "'validate_styles' as the last two commands"
-            )
-        else:
-            last_item = checklist.items[-1]
-            second_last_item = checklist.items[-2]
-            if last_item.template != "validate_styles":
-                checklist.validation_errors.append(
-                    "REQUIRED: The last command must be 'validate_styles'"
-                )
-            if second_last_item.template != "run_typescript_check":
-                checklist.validation_errors.append(
-                    "REQUIRED: The second-to-last command must be 'run_typescript_check'"
-                )
-        # Validate generate_style_tests is included (after setup_testing)
-        generate_style_tests_index = None
-        for i, item in enumerate(checklist.items):
-            if item.template == "generate_style_tests":
-                generate_style_tests_index = i
-        if setup_testing_index is not None and generate_style_tests_index is None:
-            checklist.validation_errors.append(
-                "REQUIRED: 'generate_style_tests' must be included after 'setup_testing'"
-            )
-        elif (
-            generate_style_tests_index is not None
-            and setup_testing_index is not None
-            and generate_style_tests_index <= setup_testing_index
-        ):
-            checklist.validation_errors.append(
-                "REQUIRED: 'generate_style_tests' must come after 'setup_testing'"
-            )
-        if checklist.validation_errors:
-            logger.warning(
-                f"Checklist validation errors: {checklist.validation_errors}"
-            )
-def create_checklist_from_workflow(
-    workflow_phases: List[Any],
-    context: UserContext,
-) -> GeneratedChecklist:
-    """Create a checklist from existing workflow phases (for comparison/testing).
-    This converts the old step-based workflow into the new checklist format,
-    useful for testing and migration.
-    Args:
-        workflow_phases: List of WorkflowPhase objects from factory
-        context: User context
-    Returns:
-        GeneratedChecklist representing the workflow
-    """
-    items = []
-    for phase in workflow_phases:
-        for step in phase.steps:
-            # Map step names to template names
-            template_map = {
-                "create_next_app": "create_next_app",
-                "setup_styling": "setup_app_styling",
-                "install_deps": "setup_prisma",
-                "setup_testing": "setup_testing",
-                "prisma_init": "setup_prisma",
-                "setup_prisma": "setup_prisma",
-                "manage_data_model": "generate_prisma_model",
-                "manage_api_endpoint": "generate_api_route",
-                "manage_api_endpoint_dynamic": "generate_api_route",
-                "manage_react_component": "generate_react_component",
-                "update_landing_page": "update_landing_page",
-                "validate_typescript": "run_typescript_check",
-                "validate_crud_structure": "run_typescript_check",
-                "test_crud_api": "run_typescript_check",
-            }
-            template_name = template_map.get(step.name, step.name)
-            # Extract params from step
-            params = {}
-            if hasattr(step, "get_tool_invocation"):
-                invocation = step.get_tool_invocation(context)
-                if invocation:
-                    _, step_params = invocation
-                    params = {
-                        k: v for k, v in step_params.items() if k != "project_dir"
-                    }
-            items.append(
-                ChecklistItem(
-                    template=template_name,
-                    params=params,
-                    description=step.description,
-                )
-            )
-    return GeneratedChecklist(
-        items=items,
-        reasoning="Converted from existing workflow",
-    )
+# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
+# SPDX-License-Identifier: MIT
+"""Checklist Generator for LLM-Driven Code Generation.
+This module uses an LLM to generate a checklist of template invocations
+based on the user's request and the available template catalog.
+The generator:
+1. Receives user request and project context
+2. Sends prompt to LLM with template catalog
+3. Parses LLM response into structured checklist
+4. Validates checklist items against template definitions
+The resulting checklist is then executed deterministically by
+ChecklistExecutor.
+"""
+import json
+import logging
+import re
+from dataclasses import dataclass, field
+from typing import Any, Dict, List, Optional, Protocol
+from .steps.base import UserContext
+from .template_catalog import get_catalog_prompt, validate_checklist_item
+logger = logging.getLogger(__name__)
+class ChatSDK(Protocol):
+    """Protocol for chat SDK interface."""
+    def send(self, message: str, timeout: int = 600, no_history: bool = False) -> Any:
+        """Send a message and get response."""
+        ...
+@dataclass
+class ChecklistItem:
+    """Single item in the generated checklist.
+    Represents a template invocation with its parameters and
+    the LLM's reasoning for including it.
+    """
+    template: str
+    params: Dict[str, Any]
+    description: str
+    def to_dict(self) -> Dict[str, Any]:
+        """Convert to dictionary representation."""
+        return {
+            "template": self.template,
+            "params": self.params,
+            "description": self.description,
+        }
+@dataclass
+class GeneratedChecklist:
+    """Complete checklist generated by LLM.
+    Contains the list of template invocations and the LLM's
+    overall reasoning for the chosen approach.
+    """
+    items: List[ChecklistItem]
+    reasoning: str
+    raw_response: str = ""
+    validation_errors: List[str] = field(default_factory=list)
+    @property
+    def is_valid(self) -> bool:
+        """Check if checklist passed validation."""
+        return len(self.validation_errors) == 0
+    def to_dict(self) -> Dict[str, Any]:
+        """Convert to dictionary representation."""
+        return {
+            "reasoning": self.reasoning,
+            "checklist": [item.to_dict() for item in self.items],
+            "is_valid": self.is_valid,
+            "validation_errors": self.validation_errors,
+        }
+@dataclass
+class ProjectState:
+    """Current state of the project for context."""
+    exists: bool = False
+    has_package_json: bool = False
+    has_prisma: bool = False
+    has_next_config: bool = False
+    existing_models: List[str] = field(default_factory=list)
+    existing_routes: List[str] = field(default_factory=list)
+    existing_pages: List[str] = field(default_factory=list)
+    def to_prompt(self) -> str:
+        """Generate prompt-friendly description of project state."""
+        if not self.exists:
+            return "Project does not exist yet - will be created fresh."
+        lines = ["Current project state:"]
+        if self.has_package_json:
+            lines.append("- ✓ package.json exists (Node.js project)")
+        if self.has_next_config:
+            lines.append("- ✓ next.config.ts exists (Next.js configured)")
+        if self.has_prisma:
+            lines.append("- ✓ Prisma configured")
+            if self.existing_models:
+                lines.append(f"  - Models: {', '.join(self.existing_models)}")
+        if self.existing_routes:
+            lines.append(f"- Existing API routes: {', '.join(self.existing_routes)}")
+        if self.existing_pages:
+            lines.append(f"- Existing pages: {', '.join(self.existing_pages)}")
+        return "\n".join(lines)
+CHECKLIST_SYSTEM_PROMPT = """You are a code generation planner. Your task is to analyze the user's request and generate a checklist of template invocations that will create the requested application.
+{catalog_prompt}
+## Instructions
+1. Analyze the user's request carefully
+2. Consider what the user ACTUALLY wants (semantic understanding)
+3. Select templates that will fulfill the request
+4. Add semantic enhancements based on the request type:
+   - For "todo" apps: add checkboxes for completion status
+   - For "blog" apps: add date fields for posts
+   - For "e-commerce": add price, inventory fields
+5. Ensure dependencies are satisfied (run setup before data, data before API, API before UI)
+6. Generate a complete checklist that creates a working application
+7. When follow-up fixes are requested, use `fix_code` to repair the specific files called out by validation/test logs. Extract the precise file paths and line numbers from the errors (see the Raw Validation Logs) and pass those line numbers inside the error description so the fixer knows exactly where to focus. Always reference the latest findings to decide which fixes to schedule before running validations again.
+8. If the user explicitly requests an additional UI artifact (countdown display, stats badge, etc.), schedule a `generate_react_component` step with the appropriate `artifact-*` variant (e.g., `"artifact-timer"`) and a descriptive `component_name`. Keep the artifact's logic inside that client component—server components like `page.tsx` should only render the artifact and pass any required props.
+9. **Route pairing requirement:** Whenever you schedule `{{"template": "generate_api_route", "params": {{"type": "collection", ...}}}}`, you MUST also include a matching `generate_api_route` item with `"type": "item"` for the same resource so detail pages can call `/api/<resource>/[id]`.
+This workflow repeats until all validations pass, so each checklist should either advance new functionality or explicitly repair the failures reported in the latest validation logs.
+## IMPORTANT: Complete CRUD Applications
+For any app that manages resources (todos, posts, users, etc.), you MUST generate ALL of these UI components:
+1. **Form component** (variant: "form") - Reusable form for create (generate this first so other pages can import it)
+2. **Artifact components** (variant: "artifact-*") - Any additional UI artifacts requested by the user (e.g., countdown display, stats badge). Generate these before any page that consumes them.
+3. **New page** (variant: "new") - Create new item at /resources/new
+4. **Edit page** (variant: "detail") - Edit single item at /resources/[id] with pre-populated form
+5. **List page** (variant: "list") - Main page showing all items at /resources
+Missing any of the required components (form, new, detail, list) will result in broken navigation! When artifacts are requested, they must also be generated or the UI will be incomplete.
+## REQUIRED: Setup and Validation Commands
+**CRITICAL**: The following commands are REQUIRED for a valid plan:
+1. **setup_app_styling** MUST be included after creating the application (after `create_next_app`). This configures app-wide styling with modern dark theme design system.
+2. **setup_testing** MUST be included after `setup_app_styling`. This sets up the testing infrastructure.
+3. **generate_style_tests** MUST be included after `setup_testing`. This generates CSS integrity tests that validate the design system.
+4. **The final 2 commands MUST be in this exact order:**
+   - Second-to-last: `run_typescript_check` (validates TypeScript compilation)
+   - Last: `validate_styles` (validates CSS files and design system)
+These setup and validation commands are mandatory - a plan without them is INVALID.
+## Output Format
+Respond with ONLY a JSON object (no markdown code blocks):
+{{
+  "reasoning": "Brief explanation of your approach and any semantic enhancements",
+  "checklist": [
+    {{"template": "template_name", "params": {{}}, "description": "Why this step is needed"}}
+  ]
+}}
+Important:
+- Use exact template names from the catalog
+- Provide all required parameters
+- Order items by dependency (setup first, then data, then API, then UI)
+- REQUIRED ordering for `generate_react_component`: emit all non-`list` variants (form, new, detail, actions, artifact-*) before the `variant: "list"` call so the list can import previously generated components
+- Add semantic enhancements that make the app intuitive (e.g., checkboxes for todos)
+- For CRUD apps, ALWAYS include all 4 UI variants: list, form, new, detail
+- REQUIRED: Include `setup_app_styling` after `create_next_app`
+- REQUIRED: Include `setup_testing` after `setup_app_styling`
+- REQUIRED: Include `generate_style_tests` after `setup_testing`
+- REQUIRED: End with `run_typescript_check`, then `validate_styles` as the last 2 commands
+- When converting a raw validation error into `fix_code`, copy the exact snippet (file, line, column, and message). For example:
+  Raw Validation Logs (example):
+  ```
+  {{"template": "run_typescript_check", "output": {{"errors": "path/to/File.tsx(10,5): error TS1234: <error text>\\n"}}}}
+  ```
+  Corresponding checklist item:
+  ```
+  {{
+    "template": "fix_code",
+    "params": {{
+      "file_path": "path/to/File.tsx",
+      "error_description": "path/to/File.tsx(10,5): error TS1234: <error text>"
+    }},
+    "description": "Fix the TypeScript compiler error reported for File.tsx."
+  }}
+  ```
+  Always keep the error text verbatim so the fixer knows exactly where to edit."""
+class ChecklistGenerator:
+    """Generate execution checklist using LLM.
+    The generator sends the user request, project state, and template
+    catalog to an LLM, which returns a structured checklist of template
+    invocations.
+    """
+    def __init__(self, chat_sdk: ChatSDK):
+        """Initialize the checklist generator.
+        Args:
+            chat_sdk: Chat SDK instance for LLM communication
+        """
+        self.chat = chat_sdk
+    def generate_initial_checklist(
+        self,
+        context: UserContext,
+        project_state: Optional[ProjectState] = None,
+    ) -> GeneratedChecklist:
+        """Generate the initial project-scaffolding checklist."""
+        if project_state is None:
+            project_state = ProjectState()
+        system_prompt = CHECKLIST_SYSTEM_PROMPT.format(
+            catalog_prompt=get_catalog_prompt()
+        )
+        user_prompt = self._build_initial_prompt(context, project_state)
+        full_prompt = f"{system_prompt}\n\n## User Request\n\n{user_prompt}"
+        return self._generate_from_prompt(full_prompt)
+    def generate_debug_checklist(
+        self,
+        context: UserContext,
+        project_state: Optional[ProjectState],
+        prior_errors: Optional[List[str]],
+        validation_logs: Optional[List[Any]],
+    ) -> GeneratedChecklist:
+        """Generate a remediation checklist to fix outstanding errors."""
+        if project_state is None:
+            project_state = ProjectState()
+        debug_prompt = self._build_debug_prompt(
+            context=context,
+            project_state=project_state,
+            prior_errors=prior_errors or [],
+            validation_logs=validation_logs or [],
+        )
+        system_prompt = CHECKLIST_SYSTEM_PROMPT.format(
+            catalog_prompt=get_catalog_prompt()
+        )
+        full_prompt = f"{system_prompt}\n\n## Remediation Context\n\n{debug_prompt}"
+        return self._generate_from_prompt(full_prompt)
+    def _generate_from_prompt(self, full_prompt: str) -> GeneratedChecklist:
+        """Common checklist generation logic with retries."""
+        logger.debug("Generating checklist with LLM...")
+        logger.debug(f"Checklist prompt: {full_prompt}")
+        max_attempts = 3
+        last_failure_reason = "unknown error"
+        for attempt in range(1, max_attempts + 1):
+            try:
+                response = self.chat.send(full_prompt, timeout=1200)
+                response_text = self._extract_response_text(response)
+                logger.debug(f"LLM response (attempt {attempt}): {response_text}")
+                checklist = self._parse_checklist(response_text)
+            except Exception as exc:  # pylint: disable=broad-exception-caught
+                last_failure_reason = str(exc)
+                logger.warning(
+                    "Checklist generation attempt %d/%d failed: %s",
+                    attempt,
+                    max_attempts,
+                    exc,
+                )
+                continue
+            if not checklist.items:
+                last_failure_reason = "LLM returned an empty checklist"
+                logger.warning(
+                    "Checklist generation attempt %d/%d returned no items, retrying...",
+                    attempt,
+                    max_attempts,
+                )
+                continue
+            self._validate_checklist(checklist)
+            if checklist.validation_errors:
+                last_failure_reason = "; ".join(checklist.validation_errors)
+                logger.warning(
+                    "Checklist generation attempt %d/%d failed validation: %s",
+                    attempt,
+                    max_attempts,
+                    checklist.validation_errors,
+                )
+                continue
+            logger.debug(
+                "Generated checklist with %d items on attempt %d",
+                len(checklist.items),
+                attempt,
+            )
+            return checklist
+        raise RuntimeError(
+            f"Failed to generate a valid checklist after {max_attempts} attempts: "
+            f"{last_failure_reason}"
+        )
+    def _build_initial_prompt(
+        self,
+        context: UserContext,
+        project_state: ProjectState,
+    ) -> str:
+        """Build the user prompt with all context.
+        Args:
+            context: User context
+            project_state: Current project state
+        Returns:
+            Formatted user prompt string
+        """
+        lines = [f"**User Request**: {context.user_request}"]
+        if context.entity_name:
+            lines.append(f"\n**Inferred Entity**: {context.entity_name}")
+        if context.schema_fields:
+            lines.append(f"\n**Inferred Fields**: {json.dumps(context.schema_fields)}")
+        lines.append(f"\n**Project Directory**: {context.project_dir}")
+        lines.append(f"\n**Language**: {context.language}")
+        lines.append(f"\n**Project Type**: {context.project_type}")
+        lines.append(f"\n{project_state.to_prompt()}")
+        if context.fix_feedback:
+            lines.append("\n**Outstanding Fix Requests**:")
+            for note in context.fix_feedback[-5:]:
+                lines.append(f"- {note}")
+        if context.validation_reports:
+            lines.append("\n**Recent Validation/Test Findings**:")
+            for log in context.validation_reports[-5:]:
+                status = "PASS" if log.get("success", True) else "FAIL"
+                template = log.get("template", "validation_step")
+                description = log.get("description", "")
+                lines.append(f"- [{status}] {template}: {description}")
+                if log.get("error"):
+                    lines.append(f"  Error: {log['error']}")
+                output = log.get("output", {})
+                snippet = ""
+                if isinstance(output, dict):
+                    for key in ("stdout", "stderr", "message", "details"):
+                        if output.get(key):
+                            snippet = str(output[key])[:200]
+                            break
+                    if not snippet and output:
+                        snippet = json.dumps(output)[:200]
+                elif output:
+                    snippet = str(output)[:200]
+                if snippet:
+                    lines.append(f"  Output: {snippet}")
+        lines.append("\nGenerate a checklist to fulfill this request.")
+        return "\n".join(lines)
+    def _build_debug_prompt(
+        self,
+        context: UserContext,
+        project_state: ProjectState,
+        prior_errors: List[str],
+        validation_logs: List[Any],
+    ) -> str:
+        """Build prompt for remediation/debug checklists."""
+        lines = [
+            "You are a remediation planner for the GAIA web development agent. "
+            "The project has already been scaffolded; focus exclusively on fixing outstanding issues."
+        ]
+        lines.append(f"\n**User Request**: {context.user_request}")
+        lines.append(f"\n**Project Directory**: {context.project_dir}")
+        if context.entity_name:
+            lines.append(f"\n**Entity**: {context.entity_name}")
+        if context.schema_fields:
+            lines.append(f"\n**Schema Fields**: {json.dumps(context.schema_fields)}")
+        lines.append(f"\n{project_state.to_prompt()}")
+        if prior_errors:
+            lines.append("\n**Execution Errors From Last Attempt:**")
+            for err in prior_errors:
+                lines.append(f"- {err}")
+        if validation_logs:
+            lines.append("\n**Recent Validation/Test Results:**")
+            raw_entries = []
+            for log in validation_logs[-10:]:
+                entry = log.to_dict() if hasattr(log, "to_dict") else log
+                template = entry.get("template", "unknown_step")
+                success = entry.get("success", True)
+                desc = entry.get("description", "")
+                status = "PASS" if success else "FAIL"
+                lines.append(f"- [{status}] {template}: {desc}")
+                if entry.get("error"):
+                    lines.append(f"  Error: {entry['error']}")
+                output = entry.get("output") or {}
+                for key in ("stdout", "stderr", "details", "message"):
+                    if output.get(key):
+                        snippet = str(output[key])[:200]
+                        lines.append(f"  Output: {snippet}")
+                        break
+                raw_entries.append(entry)
+            if raw_entries:
+                lines.append(
+                    "\n**Raw Validation Logs (exact text for follow-up fixes):**"
+                )
+                for entry in raw_entries:
+                    lines.append(json.dumps(entry, ensure_ascii=False))
+        if context.fix_feedback:
+            lines.append("\n**Outstanding Fix Instructions:**")
+            for note in context.fix_feedback[-10:]:
+                lines.append(f"- {note}")
+        lines.append(
+            "\nYour job: draft a concise checklist that repairs the errors above, "
+            "regenerates any broken code, and re-runs critical validations."
+        )
+        lines.append(
+            "\n**Critical Requirements for Debug Checklists:**\n"
+            "1. Use `fix_code` to repair the specific files referenced in the failures above.\n"
+            "2. Re-run any validations or tests that previously failed once fixes are applied.\n"
+            "3. Always include `run_typescript_check` as the second-to-last command to capture current compiler errors.\n"
+            "4. Always include `validate_styles` as the final command to capture CSS/design regressions."
+        )
+        return "\n".join(lines)
+    def _extract_response_text(self, response: Any) -> str:
+        """Extract text from LLM response.
+        Handles different response formats from various SDKs.
+        Args:
+            response: Response from chat SDK
+        Returns:
+            Response text string
+        """
+        if isinstance(response, str):
+            return response
+        # Handle response objects with text attribute
+        if hasattr(response, "text"):
+            return response.text
+        # Handle response objects with content attribute
+        if hasattr(response, "content"):
+            return response.content
+        # Handle dict-like responses
+        if isinstance(response, dict):
+            return response.get("text", response.get("content", str(response)))
+        return str(response)
+    def _parse_checklist(self, response_text: str) -> GeneratedChecklist:
+        """Parse LLM response into GeneratedChecklist.
+        Args:
+            response_text: Raw LLM response text
+        Returns:
+            Parsed GeneratedChecklist
+        """
+        try:
+            # Try to extract JSON from the response
+            json_str = self._extract_json(response_text)
+            data = json.loads(json_str)
+            # Parse items
+            items = []
+            for item_data in data.get("checklist", []):
+                item = ChecklistItem(
+                    template=item_data.get("template", ""),
+                    params=item_data.get("params", {}),
+                    description=item_data.get("description", ""),
+                )
+                items.append(item)
+            return GeneratedChecklist(
+                items=items,
+                reasoning=data.get("reasoning", ""),
+                raw_response=response_text,
+            )
+        except json.JSONDecodeError as e:
+            logger.error(f"Failed to parse checklist JSON: {e}")
+            return GeneratedChecklist(
+                items=[],
+                reasoning="",
+                raw_response=response_text,
+                validation_errors=[f"Failed to parse JSON: {str(e)}"],
+            )
+    def _extract_json(self, text: str) -> str:
+        """Extract JSON from text that might contain markdown or other content.
+        Args:
+            text: Text that may contain JSON
+        Returns:
+            Extracted JSON string
+        """
+        # Try to find JSON in markdown code block
+        code_block_match = re.search(r"```(?:json)?\s*\n?(.*?)\n?```", text, re.DOTALL)
+        if code_block_match:
+            return code_block_match.group(1).strip()
+        # Try to find raw JSON object
+        json_match = re.search(r"\{.*\}", text, re.DOTALL)
+        if json_match:
+            return json_match.group(0)
+        # Return as-is and let JSON parser handle it
+        return text.strip()
+    def _validate_checklist(self, checklist: GeneratedChecklist) -> None:
+        """Validate checklist items against template definitions.
+        Adds validation errors to the checklist if any are found.
+        Args:
+            checklist: Checklist to validate (modified in place)
+        """
+        for item in checklist.items:
+            errors = validate_checklist_item(item.template, item.params)
+            checklist.validation_errors.extend(errors)
+        # Check for duplicate templates (some are ok, like multiple API routes)
+        seen_templates = {}
+        for item in checklist.items:
+            key = f"{item.template}:{json.dumps(item.params, sort_keys=True)}"
+            if key in seen_templates:
+                checklist.validation_errors.append(
+                    f"Duplicate checklist item: {item.template} with same params"
+                )
+            seen_templates[key] = True
+        # Validate required setup: setup_app_styling must come after create_next_app
+        create_app_index = None
+        setup_styling_index = None
+        setup_testing_index = None
+        for i, item in enumerate(checklist.items):
+            if item.template == "create_next_app":
+                create_app_index = i
+            if item.template == "setup_app_styling":
+                setup_styling_index = i
+            if item.template == "setup_testing":
+                setup_testing_index = i
+        if create_app_index is not None:
+            if setup_styling_index is None:
+                checklist.validation_errors.append(
+                    "REQUIRED: 'setup_app_styling' must be included after 'create_next_app'"
+                )
+            elif setup_styling_index <= create_app_index:
+                checklist.validation_errors.append(
+                    "REQUIRED: 'setup_app_styling' must come after 'create_next_app' in the checklist"
+                )
+        # Validate required testing setup: setup_testing must come after setup_app_styling
+        if setup_styling_index is not None:
+            if setup_testing_index is None:
+                checklist.validation_errors.append(
+                    "REQUIRED: 'setup_testing' must be included after 'setup_app_styling'"
+                )
+            elif setup_testing_index <= setup_styling_index:
+                checklist.validation_errors.append(
+                    "REQUIRED: 'setup_testing' must come after 'setup_app_styling' in the checklist"
+                )
+        # Validate required final validation commands: run_typescript_check, validate_styles
+        if len(checklist.items) < 2:
+            checklist.validation_errors.append(
+                "REQUIRED: Checklist must end with 'run_typescript_check', "
+                "'validate_styles' as the last two commands"
+            )
+        else:
+            last_item = checklist.items[-1]
+            second_last_item = checklist.items[-2]
+            if last_item.template != "validate_styles":
+                checklist.validation_errors.append(
+                    "REQUIRED: The last command must be 'validate_styles'"
+                )
+            if second_last_item.template != "run_typescript_check":
+                checklist.validation_errors.append(
+                    "REQUIRED: The second-to-last command must be 'run_typescript_check'"
+                )
+        # Validate generate_style_tests is included (after setup_testing)
+        generate_style_tests_index = None
+        for i, item in enumerate(checklist.items):
+            if item.template == "generate_style_tests":
+                generate_style_tests_index = i
+        if setup_testing_index is not None and generate_style_tests_index is None:
+            checklist.validation_errors.append(
+                "REQUIRED: 'generate_style_tests' must be included after 'setup_testing'"
+            )
+        elif (
+            generate_style_tests_index is not None
+            and setup_testing_index is not None
+            and generate_style_tests_index <= setup_testing_index
+        ):
+            checklist.validation_errors.append(
+                "REQUIRED: 'generate_style_tests' must come after 'setup_testing'"
+            )
+        if checklist.validation_errors:
+            logger.warning(
+                f"Checklist validation errors: {checklist.validation_errors}"
+            )
+def create_checklist_from_workflow(
+    workflow_phases: List[Any],
+    context: UserContext,
+) -> GeneratedChecklist:
+    """Create a checklist from existing workflow phases (for comparison/testing).
+    This converts the old step-based workflow into the new checklist format,
+    useful for testing and migration.
+    Args:
+        workflow_phases: List of WorkflowPhase objects from factory
+        context: User context
+    Returns:
+        GeneratedChecklist representing the workflow
+    """
+    items = []
+    for phase in workflow_phases:
+        for step in phase.steps:
+            # Map step names to template names
+            template_map = {
+                "create_next_app": "create_next_app",
+                "setup_styling": "setup_app_styling",
+                "install_deps": "setup_prisma",
+                "setup_testing": "setup_testing",
+                "prisma_init": "setup_prisma",
+                "setup_prisma": "setup_prisma",
+                "manage_data_model": "generate_prisma_model",
+                "manage_api_endpoint": "generate_api_route",
+                "manage_api_endpoint_dynamic": "generate_api_route",
+                "manage_react_component": "generate_react_component",
+                "update_landing_page": "update_landing_page",
+                "validate_typescript": "run_typescript_check",
+                "validate_crud_structure": "run_typescript_check",
+                "test_crud_api": "run_typescript_check",
+            }
+            template_name = template_map.get(step.name, step.name)
+            # Extract params from step
+            params = {}
+            if hasattr(step, "get_tool_invocation"):
+                invocation = step.get_tool_invocation(context)
+                if invocation:
+                    _, step_params = invocation
+                    params = {
+                        k: v for k, v in step_params.items() if k != "project_dir"
+                    }
+            items.append(
+                ChecklistItem(
+                    template=template_name,
+                    params=params,
+                    description=step.description,
+                )
+            )
+    return GeneratedChecklist(
+        items=items,
+        reasoning="Converted from existing workflow",
+    )

amd-gaia 0.14.3__py3-none-any.whl → 0.15.1__py3-none-any.whl

amd-gaia 0.14.3py3-none-any.whl → 0.15.1py3-none-any.whl