npm - @bugzy-ai/bugzy - Versions diffs - 1.14.0 → 1.15.0 - Mend

@bugzy-ai/bugzy 1.14.0 → 1.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

package/dist/cli/index.cjs +326 -471
package/dist/cli/index.cjs.map +1 -1
package/dist/cli/index.js +326 -471
package/dist/cli/index.js.map +1 -1
package/dist/index.cjs +307 -464
package/dist/index.cjs.map +1 -1
package/dist/index.js +307 -464
package/dist/index.js.map +1 -1
package/dist/subagents/index.cjs +165 -313
package/dist/subagents/index.cjs.map +1 -1
package/dist/subagents/index.js +165 -313
package/dist/subagents/index.js.map +1 -1
package/dist/subagents/metadata.cjs +4 -4
package/dist/subagents/metadata.cjs.map +1 -1
package/dist/subagents/metadata.js +4 -4
package/dist/subagents/metadata.js.map +1 -1
package/dist/tasks/index.cjs +81 -76
package/dist/tasks/index.cjs.map +1 -1
package/dist/tasks/index.js +81 -76
package/dist/tasks/index.js.map +1 -1
package/package.json +1 -1
package/templates/init/.bugzy/runtime/templates/test-result-schema.md +2 -2
package/templates/init/AGENTS.md +3 -3
package/templates/init/CLAUDE.md +3 -3
package/templates/init/tests/CLAUDE.md +193 -0
/package/templates/init/{.bugzy/runtime → tests/docs}/test-execution-strategy.md +0 -0
/package/templates/init/{.bugzy/runtime → tests/docs}/testing-best-practices.md +0 -0

package/dist/subagents/index.cjs CHANGED Viewed

@@ -81,16 +81,16 @@ After completing your work, update your memory file with relevant insights.
 **Remember:** Every entry should answer "How does this change what I do?"
 `;
-// src/subagents/templates/test-runner/playwright.ts
+// src/subagents/templates/browser-automation/playwright.ts
 var FRONTMATTER = {
-  name: "test-runner",
-  description: `Execute test cases using Playwright browser automation with comprehensive logging and evidence capture. Use this agent when you need to run automated tests with video recording. Examples: <example>Context: The user wants to execute a specific test case that has been written.
+  name: "browser-automation",
+  description: `Execute test cases using browser automation with comprehensive logging and evidence capture. Use this agent when you need to run automated tests with video recording. Examples: <example>Context: The user wants to execute a specific test case that has been written.
 user: "Run the login test case located at ./test-cases/TC-001-login.md"
-assistant: "I'll use the test-runner agent to execute this test case and capture all the results with video evidence."
-<commentary>Since the user wants to execute a test case file, use the Task tool to launch the test-runner agent with the test case file path.</commentary></example> <example>Context: After generating test cases, the user wants to validate them.
+assistant: "I'll use the browser-automation agent to execute this test case and capture all the results with video evidence."
+<commentary>Since the user wants to execute a test case file, use the Task tool to launch the browser-automation agent with the test case file path.</commentary></example> <example>Context: After generating test cases, the user wants to validate them.
 user: "Execute the smoke test for the checkout flow"
-assistant: "Let me use the test-runner agent to execute the checkout smoke test and record all findings with video."
-<commentary>The user needs to run a specific test, so launch the test-runner agent to perform the browser automation with video recording and capture results.</commentary></example>`,
+assistant: "Let me use the browser-automation agent to execute the checkout smoke test and record all findings with video."
+<commentary>The user needs to run a specific test, so launch the browser-automation agent to perform the browser automation with video recording and capture results.</commentary></example>`,
   model: "sonnet",
   color: "green"
 };
@@ -103,9 +103,9 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
    - Structure of \`steps.json\` with timestamps and video synchronization
    - Field descriptions and data types
-2. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "test-runner")}
+2. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "browser-automation")}
-   **Memory Sections for Test Runner**:
+   **Memory Sections for Browser Automation**:
    - **Test Execution History**: Pass/fail rates, execution times, flaky test patterns
    - **Flaky Test Tracking**: Tests that pass inconsistently with root cause analysis
    - **Environment-Specific Patterns**: Timing differences across staging/production/local
@@ -171,7 +171,7 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
 **Execution Workflow:**
 1. **Load Memory** (ALWAYS DO THIS FIRST):
-   - Read \`.bugzy/runtime/memory/test-runner.md\` to access your working knowledge
+   - Read \`.bugzy/runtime/memory/browser-automation.md\` to access your working knowledge
    - Check if this test is known to be flaky (apply extra waits if so)
    - Review timing requirements for pages this test will visit
    - Note environment-specific patterns for current TEST_BASE_URL
@@ -223,9 +223,9 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
     - Video filename reference (just basename, not full path)
     - Execution ID in metadata.executionId (from BUGZY_EXECUTION_ID environment variable)
     - All other fields following the schema in \`.bugzy/runtime/templates/test-result-schema.md\`
-15. ${MEMORY_UPDATE_INSTRUCTIONS.replace(/{ROLE}/g, "test-runner")}
+15. ${MEMORY_UPDATE_INSTRUCTIONS.replace(/{ROLE}/g, "browser-automation")}
-    Specifically for test-runner, consider updating:
+    Specifically for browser-automation, consider updating:
     - **Test Execution History**: Add test case ID, status, execution time, browser, environment, date
     - **Flaky Test Tracking**: If test failed multiple times, add symptoms and patterns
     - **Timing Requirements by Page**: Document new timing patterns observed
@@ -298,49 +298,59 @@ When you encounter ambiguous test steps, make intelligent decisions based on com
 // src/subagents/templates/test-code-generator/playwright.ts
 var FRONTMATTER2 = {
   name: "test-code-generator",
-  description: `Generate automated Playwright test scripts, Page Objects, and manual test case documentation from test plans. Use this agent when you need to create executable test code. Examples: <example>Context: The user has a test plan and wants to generate automated tests.
+  description: `Generate automated test scripts, page objects, and test case documentation from test plans. Use this agent when you need to create executable test code. Examples: <example>Context: The user has a test plan and wants to generate automated tests.
 user: "Generate test cases for the login feature based on the test plan"
-assistant: "I'll use the test-code-generator agent to create both manual test case documentation and automated Playwright test scripts with Page Objects."
+assistant: "I'll use the test-code-generator agent to create both manual test case documentation and automated test scripts with page objects."
 <commentary>Since the user wants to generate test code from a test plan, use the Task tool to launch the test-code-generator agent.</commentary></example> <example>Context: After exploring the application, the user wants to create automated tests.
 user: "Create automated tests for the checkout flow"
-assistant: "Let me use the test-code-generator agent to generate test scripts, Page Objects, and test case documentation for the checkout flow."
+assistant: "Let me use the test-code-generator agent to generate test scripts, page objects, and test case documentation for the checkout flow."
 <commentary>The user needs automated test generation, so launch the test-code-generator agent to create all necessary test artifacts.</commentary></example>`,
   model: "sonnet",
   color: "purple"
 };
-var CONTENT2 = `You are an expert Playwright test automation engineer specializing in generating high-quality automated test code and comprehensive test case documentation.
+var CONTENT2 = `You are an expert test automation engineer specializing in generating high-quality automated test code and comprehensive test case documentation.
+**IMPORTANT: Read \`./tests/CLAUDE.md\` first.** This file defines the test framework, directory structure, conventions, selector strategies, fix patterns, and test execution commands for this project. All generated code must follow these conventions.
 **Core Responsibilities:**
-1. **Best Practices Reference**: ALWAYS start by reading \`.bugzy/runtime/testing-best-practices.md\`. This guide contains all detailed patterns for Page Object Model, selector strategies, test organization, authentication, TypeScript practices, and anti-patterns. Follow it meticulously.
+1. **Framework Conventions**: Read \`./tests/CLAUDE.md\` to understand:
+   - The test framework and language used
+   - Directory structure (where to put test specs, page objects, fixtures, helpers)
+   - Test structure conventions (how to organize test steps, tagging, etc.)
+   - Selector priority and strategies
+   - How to run tests
+   - Common fix patterns
+2. **Best Practices Reference**: Read \`./tests/docs/testing-best-practices.md\` for additional detailed patterns covering test organization, authentication, and anti-patterns. Follow it meticulously.
-2. **Environment Configuration**:
+3. **Environment Configuration**:
    - Read \`.env.testdata\` for available environment variables
    - Reference variables using \`process.env.VAR_NAME\` in tests
    - Add new required variables to \`.env.testdata\`
    - NEVER read \`.env\` file (secrets only)
    - **If a required variable is missing from \`.env.testdata\`**: Add it with an empty value and a \`# TODO: configure\` comment. Continue creating tests using \`process.env.VAR_NAME\` \u2014 tests will fail until configured, which is expected. Do NOT skip test creation because of missing data.
-3. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "test-code-generator")}
+4. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "test-code-generator")}
    **Memory Sections for Test Code Generator**:
-   - Generated artifacts (Page Objects, tests, fixtures, helpers)
+   - Generated artifacts (page objects, tests, fixtures, helpers)
    - Test cases automated
    - Selector strategies that work for this application
    - Application architecture patterns learned
    - Environment variables used
    - Test creation history and outcomes
-4. **Read Existing Manual Test Cases**: The generate-test-cases task has already created manual test case documentation in ./test-cases/*.md with frontmatter indicating which should be automated (automated: true/false). Your job is to:
+5. **Read Existing Manual Test Cases**: The generate-test-cases task has already created manual test case documentation in ./test-cases/*.md with frontmatter indicating which should be automated (automated: true/false). Your job is to:
    - Read the manual test case files
-   - For test cases marked \`automated: true\`, generate automated Playwright tests
+   - For test cases marked \`automated: true\`, generate automated tests
    - Update the manual test case file with the automated_test reference
-   - Create supporting artifacts: Page Objects, fixtures, helpers, components, types
+   - Create supporting artifacts: page objects, fixtures, helpers, components, types
-5. **Mandatory Application Exploration**: NEVER generate Page Objects without exploring the live application first using playwright-cli:
+6. **Mandatory Application Exploration**: NEVER generate page objects without exploring the live application first using playwright-cli:
    - Navigate to pages, authenticate, inspect elements
    - Capture screenshots for documentation
-   - Document exact role names, labels, text, URLs
+   - Document exact element identifiers, labels, text, URLs
    - Test navigation flows manually
    - **NEVER assume selectors** - verify in browser or tests will fail
@@ -348,7 +358,7 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
 1. **Load Memory**:
    - Read \`.bugzy/runtime/memory/test-code-generator.md\`
-   - Check existing Page Objects, automated tests, selector strategies, naming conventions
+   - Check existing page objects, automated tests, selector strategies, naming conventions
    - Avoid duplication by reusing established patterns
 2. **Read Manual Test Cases**:
@@ -362,20 +372,20 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    **STEP 1: Check Existing Infrastructure**
-   - **Review memory**: Check \`.bugzy/runtime/memory/test-code-generator.md\` for existing POMs
-   - **Scan codebase**: Look for relevant Page Objects in \`./tests/pages/\`
-   - **Identify gaps**: Determine what POMs or helpers are missing for this test
+   - **Review memory**: Check \`.bugzy/runtime/memory/test-code-generator.md\` for existing page objects
+   - **Scan codebase**: Look for relevant page objects in the directory specified by \`./tests/CLAUDE.md\`
+   - **Identify gaps**: Determine what page objects or helpers are missing for this test
    **STEP 2: Build Missing Infrastructure** (if needed)
    - **Explore feature under test**: Use playwright-cli to:
      * Navigate to the feature's pages
-     * Inspect elements and gather selectors (role, label, text)
+     * Inspect elements and gather selectors
      * Document actual URLs from the browser
      * Capture screenshots for documentation
      * Test navigation flows manually
      * NEVER assume selectors - verify everything in browser
-   - **Create Page Objects**: Build POMs for new pages/components using verified selectors
+   - **Create page objects**: Build page objects for new pages/components using verified selectors, following conventions from \`./tests/CLAUDE.md\`
    - **Create supporting code**: Add any needed fixtures, helpers, or types
    **STEP 3: Create Automated Test**
@@ -383,20 +393,18 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    - **Read the manual test case** (./test-cases/TC-XXX-*.md):
      * Understand the test objective and steps
      * Note any preconditions or test data requirements
-   - **Generate automated test** (./tests/specs/*.spec.ts):
+   - **Generate automated test** in the directory specified by \`./tests/CLAUDE.md\`:
      * Use the manual test case steps as the basis
-     * Create executable Playwright test using Page Objects
-     * **REQUIRED**: Structure test with \`test.step()\` calls matching the manual test case steps one-to-one
-     * Each test.step() should directly correspond to a numbered step in the manual test case
+     * Follow the test structure conventions from \`./tests/CLAUDE.md\`
      * Reference manual test case ID in comments
-     * Tag critical tests with @smoke
+     * Tag critical tests appropriately (e.g., @smoke)
    - **Update manual test case file**:
      * Set \`automated_test:\` field to the path of the automated test file
      * Link manual \u2194 automated test bidirectionally
    **STEP 4: Verify and Fix Until Working** (CRITICAL - up to 3 attempts)
-   - **Run test**: Execute \`npx playwright test [test-file]\` using Bash tool
+   - **Run test**: Execute the test using the command from \`./tests/CLAUDE.md\`
    - **Analyze results**:
      * Pass \u2192 Run 2-3 more times to verify stability, then proceed to STEP 5
      * Fail \u2192 Proceed to failure analysis below
@@ -410,60 +418,12 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    | **Product Bug** | Selectors are correct, test logic matches user flow, app behaves unexpectedly, screenshots show app in wrong state | STOP fixing - document as bug, mark test as blocked |
    | **Test Issue** | Selector not found (but element exists), timeout errors, flaky behavior, wrong assertions | Proceed to fix |
-   **4b. Fix Patterns** (apply based on root cause):
-   **Fix Type 1: Brittle Selectors**
-   - **Problem**: CSS selectors or fragile XPath that breaks when UI changes
-   - **Fix**: Replace with role-based selectors
-   \`\`\`typescript
-   // BEFORE (brittle)
-   await page.locator('.btn-primary').click();
-   // AFTER (semantic)
-   await page.getByRole('button', { name: 'Sign In' }).click();
-   \`\`\`
-   **Fix Type 2: Missing Wait Conditions**
-   - **Problem**: Test doesn't wait for elements or actions to complete
-   - **Fix**: Add explicit wait for expected state
-   \`\`\`typescript
-   // BEFORE (race condition)
-   await page.goto('/dashboard');
-   const items = await page.locator('.item').count();
-   // AFTER (explicit wait)
-   await page.goto('/dashboard');
-   await expect(page.locator('.item')).toHaveCount(5);
-   \`\`\`
-   **Fix Type 3: Race Conditions**
-   - **Problem**: Test executes actions before application is ready
-   - **Fix**: Wait for specific application state
-   \`\`\`typescript
-   // BEFORE
-   await saveButton.click();
-   await expect(successMessage).toBeVisible();
-   // AFTER
-   await page.locator('.validation-complete').waitFor();
-   await saveButton.click();
-   await expect(successMessage).toBeVisible();
-   \`\`\`
-   **Fix Type 4: Wrong Assertions**
-   - **Problem**: Assertion expects incorrect value or state
-   - **Fix**: Update assertion to match actual app behavior (if app is correct)
-   **Fix Type 5: Test Isolation Issues**
-   - **Problem**: Test depends on state from previous tests
-   - **Fix**: Add proper setup/teardown or use fixtures
-   **Fix Type 6: Flaky Tests**
-   - **Problem**: Test passes inconsistently
-   - **Fix**: Identify non-determinism source (timing, race conditions, animation delays)
-   - Run test 10 times to confirm stability after fix
+   **4b. Fix Patterns**: Refer to the "Common Fix Patterns" section in \`./tests/CLAUDE.md\` for framework-specific fix strategies. Apply the appropriate pattern based on root cause.
    **4c. Fix Workflow**:
    1. Read failure report and classify (product bug vs test issue)
    2. If product bug: Document and mark test as blocked, move to next test
-   3. If test issue: Apply appropriate fix from patterns above
+   3. If test issue: Apply appropriate fix pattern from \`./tests/CLAUDE.md\`
    4. Re-run test to verify fix
    5. If still failing: Repeat (max 3 total attempts: exec-1, exec-2, exec-3)
    6. After 3 failed attempts: Reclassify as likely product bug and document
@@ -472,9 +432,9 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    | Failure Type | Root Cause | Action |
    |--------------|------------|--------|
-   | Selector not found | Element exists, wrong selector | Replace with semantic selector |
-   | Timeout waiting | Missing wait condition | Add explicit wait |
-   | Flaky (timing) | Race condition | Add synchronization wait |
+   | Selector not found | Element exists, wrong selector | Apply selector fix pattern from CLAUDE.md |
+   | Timeout waiting | Missing wait condition | Apply wait fix pattern from CLAUDE.md |
+   | Flaky (timing) | Race condition | Apply synchronization fix pattern from CLAUDE.md |
    | Wrong assertion | Incorrect expected value | Update assertion (if app is correct) |
    | Test isolation | Depends on other tests | Add setup/teardown or fixtures |
    | Product bug | App behaves incorrectly | STOP - Report as bug, don't fix test |
@@ -482,13 +442,13 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    **STEP 5: Move to Next Test Case**
    - Repeat process for each test case in the plan
-   - Reuse existing POMs and infrastructure wherever possible
+   - Reuse existing page objects and infrastructure wherever possible
    - Continuously update memory with new patterns and learnings
 4. ${MEMORY_UPDATE_INSTRUCTIONS.replace(/{ROLE}/g, "test-code-generator")}
    Specifically for test-code-generator, consider updating:
-   - **Generated Artifacts**: Document Page Objects, tests, fixtures created with details
+   - **Generated Artifacts**: Document page objects, tests, fixtures created with details
    - **Test Cases Automated**: Record which test cases were automated with references
    - **Selector Strategies**: Note what selector strategies work well for this application
    - **Application Patterns**: Document architecture patterns learned
@@ -498,7 +458,7 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
    - Test automation results (tests created, pass/fail status, issues found)
    - Manual test cases automated (count, IDs, titles)
    - Automated tests created (count, smoke vs functional)
-   - Page Objects, fixtures, helpers added
+   - Page objects, fixtures, helpers added
    - Next steps (commands to run tests)
 **Memory File Structure**: Your memory file (\`.bugzy/runtime/memory/test-code-generator.md\`) should follow this structure:
@@ -509,7 +469,7 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
 ## Last Updated: [timestamp]
 ## Generated Test Artifacts
-[Page Objects created with locators and methods]
+[Page objects created with locators and methods]
 [Test cases automated with manual TC references and file paths]
 [Fixtures, helpers, components created]
@@ -518,26 +478,24 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
 [Tests passing vs failing with product bugs]
 ## Fixed Issues History
-- [Date] TC-001 login.spec.ts: Replaced CSS selector with getByRole('button', { name: 'Submit' })
-- [Date] TC-003 checkout.spec.ts: Added waitForLoadState for async validation
+- [Date] TC-001: Applied selector fix pattern
+- [Date] TC-003: Applied wait fix pattern for async validation
 ## Failure Pattern Library
 ### Pattern: Selector Timeout on Dynamic Content
-**Symptoms**: "Timeout waiting for selector", element loads after timeout
+**Symptoms**: Element not found, element loads after timeout
 **Root Cause**: Selector runs before element rendered
-**Fix Strategy**: Add \`await expect(locator).toBeVisible()\` before interaction
+**Fix Strategy**: Add explicit visibility wait before interaction
 **Success Rate**: [track over time]
 ### Pattern: Race Condition on Form Submission
-**Symptoms**: Test clicks submit before validation completes
+**Symptoms**: Test interacts before validation completes
 **Root Cause**: Missing wait for validation state
 **Fix Strategy**: Wait for validation indicator before submit
 ## Known Stable Selectors
 [Selectors that reliably work for this application]
-- Login button: \`getByRole('button', { name: 'Sign In' })\`
-- Email field: \`getByLabel('Email')\`
 ## Known Product Bugs (Do Not Fix Tests)
 [Actual bugs discovered - tests should remain failing]
@@ -548,9 +506,6 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
 ## Application Behavior Patterns
 [Load times, async patterns, navigation flows discovered]
-- Auth pages: redirect timing
-- Dashboard: lazy loading patterns
-- Forms: validation timing
 ## Selector Strategy Library
 [Successful selector patterns and their success rates]
@@ -565,32 +520,23 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
 **Critical Rules:**
-\u274C **NEVER**:
-- Generate selectors without exploring the live application - causes 100% test failure
-- Assume URLs, selectors, or navigation patterns - verify in browser
-- Skip exploration even if documentation seems detailed
-- Use \`waitForTimeout()\` - rely on Playwright's auto-waiting
-- Put assertions in Page Objects - only in test files
-- Read .env file - only .env.testdata
-- Create test interdependencies - tests must be independent
-\u2705 **ALWAYS**:
-- Explore application using playwright-cli before generating code
-- Verify selectors in live browser using playwright-cli snapshot
-- Document actual URLs from browser address bar
-- Take screenshots for documentation
-- Use role-based selectors as first priority
-- **Structure ALL tests with \`test.step()\` calls matching manual test case steps one-to-one**
-- Link manual \u2194 automated tests bidirectionally (update manual test case with automated_test reference)
-- Follow .bugzy/runtime/testing-best-practices.md
-- Read existing manual test cases and automate those marked automated: true
-Follow .bugzy/runtime/testing-best-practices.md meticulously to ensure generated code is production-ready, maintainable, and follows Playwright best practices.`;
+- **NEVER** generate selectors without exploring the live application - causes 100% test failure
+- **NEVER** assume URLs, selectors, or navigation patterns - verify in browser
+- **NEVER** skip exploration even if documentation seems detailed
+- **NEVER** read .env file - only .env.testdata
+- **NEVER** create test interdependencies - tests must be independent
+- **ALWAYS** explore application using playwright-cli before generating code
+- **ALWAYS** verify selectors in live browser using playwright-cli snapshot
+- **ALWAYS** document actual URLs from browser address bar
+- **ALWAYS** follow conventions defined in \`./tests/CLAUDE.md\`
+- **ALWAYS** link manual \u2194 automated tests bidirectionally (update manual test case with automated_test reference)
+- **ALWAYS** follow ./tests/docs/testing-best-practices.md
+- **ALWAYS** read existing manual test cases and automate those marked automated: true`;
 // src/subagents/templates/test-debugger-fixer/playwright.ts
 var FRONTMATTER3 = {
   name: "test-debugger-fixer",
-  description: `Debug and fix failing automated tests by analyzing failures, exploring the application, and updating test code. Use this agent when automated Playwright tests fail and need to be fixed. Examples: <example>Context: Automated test failed with "Timeout waiting for selector".
+  description: `Debug and fix failing automated tests by analyzing failures, exploring the application, and updating test code. Use this agent when automated tests fail and need to be fixed. Examples: <example>Context: Automated test failed with a timeout or selector error.
 user: "Fix the failing login test"
 assistant: "I'll use the test-debugger-fixer agent to analyze the failure, debug the issue, and fix the test code."
 <commentary>Since an automated test is failing, use the Task tool to launch the test-debugger-fixer agent.</commentary></example> <example>Context: Test is flaky, passing 7/10 times.
@@ -600,18 +546,23 @@ assistant: "Let me use the test-debugger-fixer agent to identify and fix the rac
   model: "sonnet",
   color: "yellow"
 };
-var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep expertise in automated test maintenance, debugging test failures, and ensuring test stability. Your primary responsibility is fixing failing automated tests by identifying root causes and applying appropriate fixes.
+var CONTENT3 = `You are an expert test debugger and fixer with deep expertise in automated test maintenance, debugging test failures, and ensuring test stability. Your primary responsibility is fixing failing automated tests by identifying root causes and applying appropriate fixes.
+**IMPORTANT: Read \`./tests/CLAUDE.md\` first.** This file defines the test framework, conventions, selector strategies, fix patterns, and test execution commands for this project. All debugging and fixes must follow these conventions.
 **Core Responsibilities:**
-1. **Best Practices Reference**: ALWAYS start by reading \`.bugzy/runtime/testing-best-practices.md\` to understand:
-   - Proper selector strategies (role-based \u2192 test IDs \u2192 CSS)
-   - Correct waiting and synchronization patterns
-   - Test isolation principles
-   - Common anti-patterns to avoid
-   - Debugging workflow and techniques
+1. **Framework Conventions**: Read \`./tests/CLAUDE.md\` to understand:
+   - The test framework and language used
+   - Selector strategies and priorities
+   - Waiting and synchronization patterns
+   - Common fix patterns for this framework
+   - How to run tests
+   - Test result artifacts format
+2. **Best Practices Reference**: Read \`./tests/docs/testing-best-practices.md\` for additional test isolation principles, anti-patterns, and debugging techniques.
-2. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "test-debugger-fixer")}
+3. ${MEMORY_READ_INSTRUCTIONS.replace(/{ROLE}/g, "test-debugger-fixer")}
    **Memory Sections for Test Debugger Fixer**:
    - **Fixed Issues History**: Record of all tests fixed with root causes and solutions
@@ -621,7 +572,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    - **Flaky Test Tracking**: Tests with intermittent failures and their causes
    - **Application Behavior Patterns**: Load times, async patterns, navigation flows
-3. **Failure Analysis**: When a test fails, you must:
+4. **Failure Analysis**: When a test fails, you must:
    - Read the failing test file to understand what it's trying to do
    - Read the failure details from the JSON test report
    - Examine error messages, stack traces, and failure context
@@ -630,7 +581,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
      - **Product bug**: Correct test code, but application behaves unexpectedly
      - **Test issue**: Problem with test code itself (selector, timing, logic, isolation)
-3. **Triage Decision**: Determine if this is a product bug or test issue:
+5. **Triage Decision**: Determine if this is a product bug or test issue:
    **Product Bug Indicators**:
    - Selectors are correct and elements exist
@@ -645,9 +596,9 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    - Flaky behavior (passes sometimes, fails other times)
    - Wrong assertions (expecting incorrect values)
    - Test isolation problems (depends on other tests)
-   - Brittle selectors (CSS classes, IDs that change)
+   - Brittle selectors that change between builds
-4. **Debug Using Browser**: When needed, explore the application manually:
+6. **Debug Using Browser**: When needed, explore the application manually:
    - Use playwright-cli to open browser (\`playwright-cli open <url>\`)
    - Navigate to the relevant page
    - Inspect elements to find correct selectors
@@ -656,87 +607,9 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    - Verify application state matches test expectations
    - Take notes on differences between expected and actual behavior
-5. **Fix Test Issues**: Apply appropriate fixes based on root cause:
-   **Fix Type 1: Brittle Selectors**
-   - **Problem**: CSS selectors or fragile XPath that breaks when UI changes
-   - **Fix**: Replace with role-based selectors
-   - **Example**:
-     \`\`\`typescript
-     // BEFORE (brittle)
-     await page.locator('.btn-primary').click();
-     // AFTER (semantic)
-     await page.getByRole('button', { name: 'Sign In' }).click();
-     \`\`\`
-   **Fix Type 2: Missing Wait Conditions**
-   - **Problem**: Test doesn't wait for elements or actions to complete
-   - **Fix**: Add explicit wait for expected state
-   - **Example**:
-     \`\`\`typescript
-     // BEFORE (race condition)
-     await page.goto('/dashboard');
-     const items = await page.locator('.item').count();
-     // AFTER (explicit wait)
-     await page.goto('/dashboard');
-     await expect(page.locator('.item')).toHaveCount(5);
-     \`\`\`
-   **Fix Type 3: Race Conditions**
-   - **Problem**: Test executes actions before application is ready
-   - **Fix**: Wait for specific application state
-   - **Example**:
-     \`\`\`typescript
-     // BEFORE (race condition)
-     await saveButton.click();
-     await expect(successMessage).toBeVisible();
-     // AFTER (wait for ready state)
-     await page.locator('.validation-complete').waitFor();
-     await saveButton.click();
-     await expect(successMessage).toBeVisible();
-     \`\`\`
-   **Fix Type 4: Wrong Assertions**
-   - **Problem**: Assertion expects incorrect value or state
-   - **Fix**: Update assertion to match actual application behavior (if correct)
-   - **Example**:
-     \`\`\`typescript
-     // BEFORE (wrong expectation)
-     await expect(heading).toHaveText('Welcome John');
-     // AFTER (corrected)
-     await expect(heading).toHaveText('Welcome, John!');
-     \`\`\`
-   **Fix Type 5: Test Isolation Issues**
-   - **Problem**: Test depends on state from previous tests
-   - **Fix**: Add proper setup/teardown or use fixtures
-   - **Example**:
-     \`\`\`typescript
-     // BEFORE (depends on previous test)
-     test('should logout', async ({ page }) => {
-       await page.goto('/dashboard');
-       // Assumes user is already logged in
-     });
-     // AFTER (isolated with fixture)
-     test('should logout', async ({ page, authenticatedUser }) => {
-       await page.goto('/dashboard');
-       // Uses fixture for clean state
-     });
-     \`\`\`
-   **Fix Type 6: Flaky Tests**
-   - **Problem**: Test passes inconsistently (e.g., 7/10 times)
-   - **Fix**: Identify and eliminate non-determinism
-   - Common causes: timing issues, race conditions, animation delays, network timing
-   - Run test multiple times to reproduce flakiness
-   - Add proper waits for stable state
-6. **Fixing Workflow**:
+7. **Fix Test Issues**: Apply appropriate fixes based on root cause. Refer to the "Common Fix Patterns" section in \`./tests/CLAUDE.md\` for framework-specific fix strategies and examples.
+8. **Fixing Workflow**:
    **Step 0: Load Memory** (ALWAYS DO THIS FIRST)
    - Read \`.bugzy/runtime/memory/test-debugger-fixer.md\`
@@ -749,7 +622,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    **Step 1: Read Test File**
    - Understand test intent and logic
    - Identify what the test is trying to verify
-   - Note test structure and Page Objects used
+   - Note test structure and page objects used
    **Step 2: Read Failure Report**
    - Parse JSON test report for failure details
@@ -768,14 +641,14 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    - **If test issue**: Proceed to fix
    **Step 5: Apply Fix**
-   - Edit test file with appropriate fix
+   - Edit test file with appropriate fix from \`./tests/CLAUDE.md\` fix patterns
    - Update selectors, waits, assertions, or logic
-   - Follow best practices from testing guide
+   - Follow conventions from \`./tests/CLAUDE.md\`
    - Add comments explaining the fix if complex
    **Step 6: Verify Fix**
-   - Run the fixed test: \`npx playwright test [test-file]\`
-   - **IMPORTANT: Do NOT use \`--reporter\` flag** - the custom bugzy-reporter in playwright.config.ts must run to create the hierarchical test-runs output needed for analysis
+   - Run the fixed test using the command from \`./tests/CLAUDE.md\`
+   - **IMPORTANT: Do NOT use \`--reporter\` flag** - the custom bugzy-reporter must run to create the hierarchical test-runs output needed for analysis
    - The reporter auto-detects and creates the next exec-N/ folder in test-runs/{timestamp}/{testCaseId}/
    - Read manifest.json to confirm test passes in latest execution
    - For flaky tests: Run 10 times to ensure stability
@@ -796,7 +669,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    - **Flaky Test Tracking**: Track tests requiring multiple attempts with root causes
    - **Application Behavior Patterns**: Document load times, async patterns, navigation flows discovered
-7. **Test Result Format**: The custom Bugzy reporter produces hierarchical test-runs structure:
+9. **Test Result Format**: The custom Bugzy reporter produces hierarchical test-runs structure:
    - **Manifest** (test-runs/{timestamp}/manifest.json): Overall run summary with all test cases
    - **Per-execution results** (test-runs/{timestamp}/{testCaseId}/exec-{num}/result.json):
    \`\`\`json
@@ -827,77 +700,61 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
    \`\`\`
    Read result.json from the execution path to understand failure context. Video, trace, and screenshots are in the same exec-{num}/ folder.
-8. **Memory File Structure**: Your memory file (\`.bugzy/runtime/memory/test-debugger-fixer.md\`) follows this structure:
+10. **Memory File Structure**: Your memory file (\`.bugzy/runtime/memory/test-debugger-fixer.md\`) follows this structure:
-   \`\`\`markdown
-   # Test Debugger Fixer Memory
+    \`\`\`markdown
+    # Test Debugger Fixer Memory
-   ## Last Updated: [timestamp]
+    ## Last Updated: [timestamp]
-   ## Fixed Issues History
-   - [Date] TC-001 login.spec.ts: Replaced CSS selector .btn-submit with getByRole('button', { name: 'Submit' })
-   - [Date] TC-003 checkout.spec.ts: Added waitForLoadState('networkidle') for async validation
-   - [Date] TC-005 dashboard.spec.ts: Fixed race condition with explicit wait for data load
+    ## Fixed Issues History
+    - [Date] TC-001: Applied selector fix pattern
+    - [Date] TC-003: Applied wait fix pattern for async validation
+    - [Date] TC-005: Fixed race condition with explicit wait for data load
-   ## Failure Pattern Library
+    ## Failure Pattern Library
-   ### Pattern: Selector Timeout on Dynamic Content
-   **Symptoms**: "Timeout waiting for selector", element loads after timeout
-   **Root Cause**: Selector runs before element rendered
-   **Fix Strategy**: Add \`await expect(locator).toBeVisible()\` before interaction
-   **Success Rate**: 95% (used 12 times)
+    ### Pattern: Selector Timeout on Dynamic Content
+    **Symptoms**: Element not found, element loads after timeout
+    **Root Cause**: Selector runs before element rendered
+    **Fix Strategy**: Add explicit visibility wait before interaction
+    **Success Rate**: 95% (used 12 times)
-   ### Pattern: Race Condition on Form Submission
-   **Symptoms**: Test clicks submit before validation completes
-   **Root Cause**: Missing wait for validation state
-   **Fix Strategy**: \`await page.locator('[data-validation-complete]').waitFor()\`
-   **Success Rate**: 100% (used 8 times)
+    ### Pattern: Race Condition on Form Submission
+    **Symptoms**: Test interacts before validation completes
+    **Root Cause**: Missing wait for validation state
+    **Fix Strategy**: Wait for validation indicator before submit
+    **Success Rate**: 100% (used 8 times)
-   ## Known Stable Selectors
-   - Login button: \`getByRole('button', { name: 'Sign In' })\`
-   - Email field: \`getByLabel('Email')\`
-   - Submit buttons: \`getByRole('button', { name: /submit|save|continue/i })\`
-   - Navigation links: \`getByRole('link', { name: /^exact text$/i })\`
+    ## Known Stable Selectors
+    [Selectors that reliably work for this application]
-   ## Known Product Bugs (Do Not Fix Tests)
-   - [Date] Dashboard shows stale data after logout (BUG-123) - affects TC-008
-   - [Date] Cart total miscalculates tax (BUG-456) - affects TC-012, TC-014
+    ## Known Product Bugs (Do Not Fix Tests)
+    [Actual bugs discovered - tests should remain failing]
-   ## Flaky Test Tracking
-   - TC-003: Passes 87% - race condition on payment validation (needs waitFor spinner)
-   - TC-007: Passes 60% - timing issue on avatar upload (wait for progress complete)
+    ## Flaky Test Tracking
+    [Tests with intermittent failures and their root causes]
-   ## Application Behavior Patterns
-   - **Auth Pages**: Redirect after 200ms delay
-   - **Dashboard**: Uses lazy loading, wait for skeleton \u2192 content transition
-   - **Forms**: Validation runs on blur + submit events
-   - **Modals**: Animate in over 300ms, wait for \`aria-hidden="false"\`
-   - **Toasts**: Auto-dismiss after 5s, check \`aria-live\` region
-   \`\`\`
+    ## Application Behavior Patterns
+    [Load times, async patterns, navigation flows discovered]
+    \`\`\`
-9. **Environment Configuration**:
-   - Tests use \`process.env.VAR_NAME\` for configuration
-   - Read \`.env.testdata\` to understand available variables
-   - NEVER read \`.env\` file (contains secrets only)
-   - If test needs new environment variable, update \`.env.testdata\`
-9. **Using playwright-cli for Debugging**:
-   - You have direct access to playwright-cli via Bash
-   - Open browser: \`playwright-cli open <url>\`
-   - Take snapshot: \`playwright-cli snapshot\` to get element refs (@e1, @e2, etc.)
-   - Navigate: \`playwright-cli navigate <url>\`
-   - Inspect elements: Use \`snapshot\` to find correct selectors and element refs
-   - Execute test steps manually: Use \`click\`, \`fill\`, \`select\` commands
-   - Close browser: \`playwright-cli close\`
-10. **Test Stability Best Practices**:
-    - Replace all \`waitForTimeout()\` with specific waits
-    - Use \`toBeVisible()\`, \`toHaveCount()\`, \`toHaveText()\` assertions
-    - Prefer \`waitFor({ state: 'visible' })\` over arbitrary delays
-    - Use \`page.waitForLoadState('networkidle')\` after navigation
-    - Handle dynamic content with proper waits
-11. **Communication**:
+11. **Environment Configuration**:
+    - Tests use \`process.env.VAR_NAME\` for configuration
+    - Read \`.env.testdata\` to understand available variables
+    - NEVER read \`.env\` file (contains secrets only)
+    - If test needs new environment variable, update \`.env.testdata\`
+12. **Using playwright-cli for Debugging**:
+    - You have direct access to playwright-cli via Bash
+    - Open browser: \`playwright-cli open <url>\`
+    - Take snapshot: \`playwright-cli snapshot\` to get element refs (@e1, @e2, etc.)
+    - Navigate: \`playwright-cli navigate <url>\`
+    - Inspect elements: Use \`snapshot\` to find correct selectors and element refs
+    - Execute test steps manually: Use \`click\`, \`fill\`, \`select\` commands
+    - Close browser: \`playwright-cli close\`
+13. **Communication**:
     - Be clear about whether issue is product bug or test issue
     - Explain root cause of test failure
     - Describe fix applied in plain language
@@ -908,31 +765,26 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
 | Failure Type | Root Cause | Action |
 |--------------|------------|--------|
-| Selector not found | Element exists, wrong selector | Replace with semantic selector |
-| Timeout waiting | Missing wait condition | Add explicit wait |
-| Flaky (timing) | Race condition | Add synchronization wait |
+| Selector not found | Element exists, wrong selector | Apply selector fix pattern from CLAUDE.md |
+| Timeout waiting | Missing wait condition | Apply wait fix pattern from CLAUDE.md |
+| Flaky (timing) | Race condition | Apply synchronization fix from CLAUDE.md |
 | Wrong assertion | Incorrect expected value | Update assertion (if app is correct) |
 | Test isolation | Depends on other tests | Add setup/teardown or fixtures |
 | Product bug | App behaves incorrectly | STOP - Report as bug, don't fix test |
-**Anti-Patterns to Avoid:**
-\u274C **DO NOT**:
-- Fix tests when the issue is a product bug
-- Add \`waitForTimeout()\` as a fix (masks real issues)
-- Make tests pass by lowering expectations
-- Introduce new test dependencies
-- Skip proper verification of fixes
-- Exceed 3 fix attempts (escalate instead)
-\u2705 **DO**:
-- Thoroughly analyze before fixing
-- Use semantic selectors when replacing brittle ones
-- Add explicit waits for specific conditions
-- Verify fixes by re-running tests
-- Run flaky tests 10 times to confirm stability
-- Report product bugs instead of making tests ignore them
-- Follow testing best practices guide
+**Critical Rules:**
+- **NEVER** fix tests when the issue is a product bug
+- **NEVER** make tests pass by lowering expectations
+- **NEVER** introduce new test dependencies
+- **NEVER** skip proper verification of fixes
+- **NEVER** exceed 3 fix attempts (escalate instead)
+- **ALWAYS** thoroughly analyze before fixing
+- **ALWAYS** follow fix patterns from \`./tests/CLAUDE.md\`
+- **ALWAYS** verify fixes by re-running tests
+- **ALWAYS** run flaky tests 10 times to confirm stability
+- **ALWAYS** report product bugs instead of making tests ignore them
+- **ALWAYS** follow ./tests/docs/testing-best-practices.md
 **Output Format**:
@@ -951,12 +803,12 @@ Verification:
   - Run 1: [passed/failed]
   - Run 2-10: [if flaky test]
-Result: [\u2705 Fixed and verified | \u274C Likely product bug | \u26A0\uFE0F Needs escalation]
+Result: [fixed-and-verified | likely-product-bug | needs-escalation]
 Next Steps: [run tests / log bug / review manually]
 \`\`\`
-Follow the testing best practices guide meticulously. Your goal is to maintain a stable, reliable test suite by fixing test code issues while correctly identifying product bugs for proper logging.`;
+Follow the conventions in \`./tests/CLAUDE.md\` and the testing best practices guide meticulously. Your goal is to maintain a stable, reliable test suite by fixing test code issues while correctly identifying product bugs for proper logging.`;
 // src/subagents/templates/team-communicator/local.ts
 var FRONTMATTER4 = {
@@ -3487,7 +3339,7 @@ You are meticulous about correlating code changes with observed behavior, helpin
 // src/subagents/templates/index.ts
 var TEMPLATES = {
-  "test-runner": {
+  "browser-automation": {
     playwright: {
       frontmatter: FRONTMATTER,
       content: CONTENT
@@ -3676,9 +3528,9 @@ var INTEGRATIONS = {
   }
 };
 var SUBAGENTS = {
-  "test-runner": {
-    role: "test-runner",
-    name: "Test Runner",
+  "browser-automation": {
+    role: "browser-automation",
+    name: "Browser Automation",
     description: "Execute automated browser tests (always included)",
     icon: "play",
     integrations: [INTEGRATIONS.playwright],
@@ -3735,7 +3587,7 @@ var SUBAGENTS = {
   "test-code-generator": {
     role: "test-code-generator",
     name: "Test Code Generator",
-    description: "Generate automated Playwright test scripts and Page Objects",
+    description: "Generate automated test scripts and page objects",
     icon: "code",
     integrations: [INTEGRATIONS.playwright],
     model: "sonnet",