@bugzy-ai/bugzy 1.13.0 → 1.14.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli/index.cjs +339 -253
- package/dist/cli/index.cjs.map +1 -1
- package/dist/cli/index.js +339 -253
- package/dist/cli/index.js.map +1 -1
- package/dist/index.cjs +138 -57
- package/dist/index.cjs.map +1 -1
- package/dist/index.js +138 -57
- package/dist/index.js.map +1 -1
- package/dist/subagents/index.cjs +44 -27
- package/dist/subagents/index.cjs.map +1 -1
- package/dist/subagents/index.js +44 -27
- package/dist/subagents/index.js.map +1 -1
- package/dist/subagents/metadata.cjs +1 -1
- package/dist/subagents/metadata.cjs.map +1 -1
- package/dist/subagents/metadata.js +1 -1
- package/dist/subagents/metadata.js.map +1 -1
- package/dist/tasks/index.cjs +38 -0
- package/dist/tasks/index.cjs.map +1 -1
- package/dist/tasks/index.js +38 -0
- package/dist/tasks/index.js.map +1 -1
- package/package.json +1 -1
- package/templates/init/.bugzy/runtime/testing-best-practices.md +1 -1
- package/templates/init/AGENTS.md +1 -1
- package/templates/init/CLAUDE.md +1 -1
package/dist/index.cjs
CHANGED
|
@@ -90,31 +90,6 @@ var MCP_SERVERS = {
|
|
|
90
90
|
}
|
|
91
91
|
}
|
|
92
92
|
},
|
|
93
|
-
playwright: {
|
|
94
|
-
provider: "playwright",
|
|
95
|
-
name: "Playwright",
|
|
96
|
-
description: "Playwright MCP server for browser automation",
|
|
97
|
-
requiresCredentials: false,
|
|
98
|
-
npmPackages: ["@playwright/mcp"],
|
|
99
|
-
config: {
|
|
100
|
-
command: "playwright-mcp",
|
|
101
|
-
args: [
|
|
102
|
-
"--browser",
|
|
103
|
-
"chromium",
|
|
104
|
-
"--secrets",
|
|
105
|
-
".env",
|
|
106
|
-
"--no-sandbox",
|
|
107
|
-
"--viewport-size",
|
|
108
|
-
"1280x720"
|
|
109
|
-
]
|
|
110
|
-
},
|
|
111
|
-
containerExtensions: {
|
|
112
|
-
args: ["--headless"],
|
|
113
|
-
env: {
|
|
114
|
-
PLAYWRIGHT_BROWSERS_PATH: "/opt/ms-playwright"
|
|
115
|
-
}
|
|
116
|
-
}
|
|
117
|
-
},
|
|
118
93
|
notion: {
|
|
119
94
|
provider: "notion",
|
|
120
95
|
name: "Notion",
|
|
@@ -473,6 +448,9 @@ Before invoking the agent, identify the test cases for the current area:
|
|
|
473
448
|
- Existing automated tests: ./tests/specs/
|
|
474
449
|
- Existing Page Objects: ./tests/pages/
|
|
475
450
|
|
|
451
|
+
**Knowledge Base Patterns (MUST APPLY):**
|
|
452
|
+
Include ALL relevant testing patterns from the knowledge base that apply to this area. For example, if the KB documents timing behaviors (animation delays, loading states), selector gotchas, or recommended assertion approaches \u2014 list them here explicitly and instruct the agent to use the specific patterns described (e.g., specific assertion methods with specific timeouts). The test-code-generator does not have access to the knowledge base, so you MUST relay the exact patterns and recommended code approaches.
|
|
453
|
+
|
|
476
454
|
**The agent should:**
|
|
477
455
|
1. Read the manual test case files for this area
|
|
478
456
|
2. Check existing Page Object infrastructure for this area
|
|
@@ -481,6 +459,7 @@ Before invoking the agent, identify the test cases for the current area:
|
|
|
481
459
|
5. For each test case marked \`automated: true\`:
|
|
482
460
|
- Create automated Playwright test in ./tests/specs/
|
|
483
461
|
- Update the manual test case file to reference the automated test path
|
|
462
|
+
- Apply ALL knowledge base patterns listed above (timing, selectors, assertions)
|
|
484
463
|
6. Run and iterate on each test until it passes or fails with a product bug
|
|
485
464
|
7. Update .env.testdata with any new variables
|
|
486
465
|
|
|
@@ -1661,6 +1640,40 @@ The input format determines the trigger source and context extraction strategy.`
|
|
|
1661
1640
|
Store the detected trigger for use in output routing:
|
|
1662
1641
|
- Set variable: \`TRIGGER_SOURCE\` = [GITHUB_PR | SLACK_MESSAGE | CI_CD | MANUAL]
|
|
1663
1642
|
- This determines output formatting and delivery channel`
|
|
1643
|
+
},
|
|
1644
|
+
// Step 5c: Coverage Gap vs. Ambiguity (inline)
|
|
1645
|
+
{
|
|
1646
|
+
inline: true,
|
|
1647
|
+
title: "Coverage Gap vs. Ambiguity",
|
|
1648
|
+
content: `### Coverage Gap vs. Ambiguity
|
|
1649
|
+
|
|
1650
|
+
When the trigger indicates a feature has been implemented and is ready for testing (Jira "Ready to Test", PR merged, CI/CD pipeline):
|
|
1651
|
+
|
|
1652
|
+
**Missing test coverage for the referenced feature is a COVERAGE GAP, not an ambiguity.**
|
|
1653
|
+
|
|
1654
|
+
- The developer/team is asserting the feature exists and is ready for testing
|
|
1655
|
+
- "Not yet explored" or "out of scope" in the test plan means the QA team hasn't tested it yet \u2014 it does NOT mean the feature doesn't exist
|
|
1656
|
+
- Do NOT classify as CRITICAL based on stale documentation or knowledge base gaps
|
|
1657
|
+
- If project-context.md or the Jira issue references the feature, assume it exists until browser exploration proves otherwise
|
|
1658
|
+
- Coverage gaps are handled in the "Create Tests for Coverage Gaps" step below \u2014 do NOT block here
|
|
1659
|
+
|
|
1660
|
+
### If You Browse the App and Cannot Find the Referenced Feature
|
|
1661
|
+
|
|
1662
|
+
Apply the Clarification Protocol's **"Execution Obstacle vs. Requirement Ambiguity"** principle:
|
|
1663
|
+
|
|
1664
|
+
This is an **execution obstacle**, NOT a requirement ambiguity \u2014 because the authoritative trigger source (Jira issue, PR, team request) asserts the feature exists. Common causes for not finding it:
|
|
1665
|
+
- **Missing role/tier**: You're logged in as a basic user but the feature requires admin/premium access
|
|
1666
|
+
- **Missing test data**: Required test accounts or data haven't been configured in \`.env.testdata\`
|
|
1667
|
+
- **Feature flags**: The feature is behind a flag not enabled in the test environment
|
|
1668
|
+
- **Environment config**: The feature requires specific environment variables or deployment settings
|
|
1669
|
+
|
|
1670
|
+
**Action: PROCEED to "Create Tests for Coverage Gaps".** Do NOT BLOCK.
|
|
1671
|
+
- Create test cases and specs that reference the feature as described in the trigger
|
|
1672
|
+
- Add placeholder env vars to \`.env.testdata\` for any missing credentials
|
|
1673
|
+
- Notify the team (via team-communicator) about the access obstacle and what needs to be configured
|
|
1674
|
+
- Tests may fail until the obstacle is resolved \u2014 this is expected and acceptable
|
|
1675
|
+
|
|
1676
|
+
**Only classify as CRITICAL (and BLOCK) if NO authoritative trigger source claims the feature exists** \u2014 e.g., a vague manual request with no Jira/PR backing.`
|
|
1664
1677
|
},
|
|
1665
1678
|
// Step 6: Clarification Protocol (library)
|
|
1666
1679
|
"clarification-protocol",
|
|
@@ -2338,7 +2351,7 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2338
2351
|
|
|
2339
2352
|
3. **Environment Setup**: Before test execution:
|
|
2340
2353
|
- Read \`.env.testdata\` to get non-secret environment variable values (TEST_BASE_URL, TEST_OWNER_EMAIL, etc.)
|
|
2341
|
-
- For secrets, variable names
|
|
2354
|
+
- For secrets, the values are available as environment variables under the same variable names (playwright-cli inherits the process environment)
|
|
2342
2355
|
|
|
2343
2356
|
4. **Test Case Parsing**: You will receive a test case file path. Parse the test case to extract:
|
|
2344
2357
|
- Test steps and actions to perform
|
|
@@ -2346,16 +2359,16 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2346
2359
|
- Test data and input values (replace any \${TEST_*} or $TEST_* variables with actual values from .env)
|
|
2347
2360
|
- Preconditions and setup requirements
|
|
2348
2361
|
|
|
2349
|
-
5. **Browser Automation Execution**: Using
|
|
2350
|
-
- Launch a browser
|
|
2351
|
-
- Execute each test step sequentially
|
|
2362
|
+
5. **Browser Automation Execution**: Using playwright-cli (CLI-based browser automation):
|
|
2363
|
+
- Launch a browser: \`playwright-cli open <url>\`
|
|
2364
|
+
- Execute each test step sequentially using CLI commands: \`click\`, \`fill\`, \`select\`, \`hover\`, etc.
|
|
2365
|
+
- Use \`snapshot\` to inspect page state and find element references (@e1, @e2, etc.)
|
|
2352
2366
|
- Handle dynamic waits and element interactions intelligently
|
|
2353
2367
|
- Manage browser state between steps
|
|
2354
2368
|
- **IMPORTANT - Environment Variable Handling**:
|
|
2355
2369
|
- When test cases contain environment variables:
|
|
2356
2370
|
- For non-secrets (TEST_BASE_URL, TEST_OWNER_EMAIL): Read actual values from .env.testdata and use them directly
|
|
2357
|
-
- For secrets (TEST_OWNER_PASSWORD, API keys):
|
|
2358
|
-
- Playwright MCP automatically reads .env for secrets and injects them at runtime
|
|
2371
|
+
- For secrets (TEST_OWNER_PASSWORD, API keys): playwright-cli inherits environment variables from the process
|
|
2359
2372
|
- Example: Test says "Navigate to TEST_BASE_URL/login" \u2192 Read TEST_BASE_URL from .env.testdata, use the actual URL
|
|
2360
2373
|
|
|
2361
2374
|
6. **Evidence Collection at Each Step**:
|
|
@@ -2380,7 +2393,7 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2380
2393
|
- \`steps.json\`: Structured steps with timestamps, video time synchronization, and detailed descriptions (see schema)
|
|
2381
2394
|
|
|
2382
2395
|
Video handling:
|
|
2383
|
-
-
|
|
2396
|
+
- Videos are automatically saved to the \`.playwright-mcp/\` folder via the PLAYWRIGHT_MCP_SAVE_VIDEO env var
|
|
2384
2397
|
- Find the latest video: \`ls -t .playwright-mcp/*.webm 2>/dev/null | head -1\`
|
|
2385
2398
|
- Store ONLY the filename in summary.json: \`{ "video": { "filename": "basename.webm" } }\`
|
|
2386
2399
|
- Do NOT copy, move, or delete video files - external service handles uploads
|
|
@@ -2419,8 +2432,7 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2419
2432
|
- Identify all TEST_* variable references (e.g., TEST_BASE_URL, TEST_OWNER_EMAIL, TEST_OWNER_PASSWORD)
|
|
2420
2433
|
- Read .env.testdata to get actual values for non-secret variables
|
|
2421
2434
|
- For non-secrets (TEST_BASE_URL, TEST_OWNER_EMAIL, etc.): Use actual values from .env.testdata directly in test execution
|
|
2422
|
-
- For secrets (TEST_OWNER_PASSWORD, API keys, etc.):
|
|
2423
|
-
- Playwright MCP will read .env and inject secret values during browser automation
|
|
2435
|
+
- For secrets (TEST_OWNER_PASSWORD, API keys, etc.): playwright-cli inherits env vars from the process environment
|
|
2424
2436
|
- If a required variable is not found in .env.testdata, log a warning but continue
|
|
2425
2437
|
|
|
2426
2438
|
5. Extract execution ID from the execution environment:
|
|
@@ -2434,7 +2446,7 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2434
2446
|
- Describe what action will be performed (communicate to user)
|
|
2435
2447
|
- Log the step being executed with timestamp
|
|
2436
2448
|
- Calculate elapsed time from test start (for videoTimeSeconds)
|
|
2437
|
-
- Execute the action using
|
|
2449
|
+
- Execute the action using playwright-cli commands (click, fill, select, etc. with element refs)
|
|
2438
2450
|
- Wait for page stability
|
|
2439
2451
|
- Validate expected behavior
|
|
2440
2452
|
- Record findings and actual behavior
|
|
@@ -2509,12 +2521,11 @@ var CONTENT = `You are an expert automated test execution specialist with deep e
|
|
|
2509
2521
|
**Environment Variable Handling:**
|
|
2510
2522
|
- Read .env.testdata at the start of execution to get non-secret environment variables
|
|
2511
2523
|
- For non-secrets (TEST_BASE_URL, TEST_OWNER_EMAIL, etc.): Use actual values from .env.testdata directly
|
|
2512
|
-
- For secrets (TEST_OWNER_PASSWORD, API keys):
|
|
2513
|
-
- Playwright MCP reads .env for secrets and injects them during browser automation
|
|
2524
|
+
- For secrets (TEST_OWNER_PASSWORD, API keys): playwright-cli inherits env vars from the process environment
|
|
2514
2525
|
- DO NOT read .env yourself (security policy - it contains only secrets)
|
|
2515
2526
|
- DO NOT make up fake values or fallbacks
|
|
2516
2527
|
- If a variable is missing from .env.testdata, log a warning
|
|
2517
|
-
- If
|
|
2528
|
+
- If a secret env var is missing/empty, that indicates .env is misconfigured
|
|
2518
2529
|
- Document which environment variables were used in the test run summary
|
|
2519
2530
|
|
|
2520
2531
|
When you encounter ambiguous test steps, make intelligent decisions based on common testing patterns and document your interpretation. Always prioritize capturing evidence over speed of execution. Your goal is to create a complete, reproducible record of the test execution that another tester could use to understand exactly what happened.`;
|
|
@@ -2561,7 +2572,7 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
|
|
|
2561
2572
|
- Update the manual test case file with the automated_test reference
|
|
2562
2573
|
- Create supporting artifacts: Page Objects, fixtures, helpers, components, types
|
|
2563
2574
|
|
|
2564
|
-
5. **Mandatory Application Exploration**: NEVER generate Page Objects without exploring the live application first using
|
|
2575
|
+
5. **Mandatory Application Exploration**: NEVER generate Page Objects without exploring the live application first using playwright-cli:
|
|
2565
2576
|
- Navigate to pages, authenticate, inspect elements
|
|
2566
2577
|
- Capture screenshots for documentation
|
|
2567
2578
|
- Document exact role names, labels, text, URLs
|
|
@@ -2592,7 +2603,7 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
|
|
|
2592
2603
|
|
|
2593
2604
|
**STEP 2: Build Missing Infrastructure** (if needed)
|
|
2594
2605
|
|
|
2595
|
-
- **Explore feature under test**: Use
|
|
2606
|
+
- **Explore feature under test**: Use playwright-cli to:
|
|
2596
2607
|
* Navigate to the feature's pages
|
|
2597
2608
|
* Inspect elements and gather selectors (role, label, text)
|
|
2598
2609
|
* Document actual URLs from the browser
|
|
@@ -2799,8 +2810,8 @@ var CONTENT2 = `You are an expert Playwright test automation engineer specializi
|
|
|
2799
2810
|
- Create test interdependencies - tests must be independent
|
|
2800
2811
|
|
|
2801
2812
|
\u2705 **ALWAYS**:
|
|
2802
|
-
- Explore application using
|
|
2803
|
-
- Verify selectors in live browser using
|
|
2813
|
+
- Explore application using playwright-cli before generating code
|
|
2814
|
+
- Verify selectors in live browser using playwright-cli snapshot
|
|
2804
2815
|
- Document actual URLs from browser address bar
|
|
2805
2816
|
- Take screenshots for documentation
|
|
2806
2817
|
- Use role-based selectors as first priority
|
|
@@ -2872,7 +2883,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
|
|
|
2872
2883
|
- Brittle selectors (CSS classes, IDs that change)
|
|
2873
2884
|
|
|
2874
2885
|
4. **Debug Using Browser**: When needed, explore the application manually:
|
|
2875
|
-
- Use
|
|
2886
|
+
- Use playwright-cli to open browser (\`playwright-cli open <url>\`)
|
|
2876
2887
|
- Navigate to the relevant page
|
|
2877
2888
|
- Inspect elements to find correct selectors
|
|
2878
2889
|
- Manually perform test steps to understand actual behavior
|
|
@@ -2982,7 +2993,7 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
|
|
|
2982
2993
|
- Check for screenshot/trace file references
|
|
2983
2994
|
|
|
2984
2995
|
**Step 3: Reproduce and Debug**
|
|
2985
|
-
- Open browser via
|
|
2996
|
+
- Open browser via playwright-cli if needed (\`playwright-cli open <url>\`)
|
|
2986
2997
|
- Navigate to relevant page
|
|
2987
2998
|
- Manually execute test steps
|
|
2988
2999
|
- Identify discrepancy between test expectations and actual behavior
|
|
@@ -3105,13 +3116,14 @@ var CONTENT3 = `You are an expert Playwright test debugger and fixer with deep e
|
|
|
3105
3116
|
- NEVER read \`.env\` file (contains secrets only)
|
|
3106
3117
|
- If test needs new environment variable, update \`.env.testdata\`
|
|
3107
3118
|
|
|
3108
|
-
9. **Using
|
|
3109
|
-
- You have direct access to
|
|
3110
|
-
- Open browser:
|
|
3111
|
-
-
|
|
3112
|
-
-
|
|
3113
|
-
-
|
|
3114
|
-
-
|
|
3119
|
+
9. **Using playwright-cli for Debugging**:
|
|
3120
|
+
- You have direct access to playwright-cli via Bash
|
|
3121
|
+
- Open browser: \`playwright-cli open <url>\`
|
|
3122
|
+
- Take snapshot: \`playwright-cli snapshot\` to get element refs (@e1, @e2, etc.)
|
|
3123
|
+
- Navigate: \`playwright-cli navigate <url>\`
|
|
3124
|
+
- Inspect elements: Use \`snapshot\` to find correct selectors and element refs
|
|
3125
|
+
- Execute test steps manually: Use \`click\`, \`fill\`, \`select\` commands
|
|
3126
|
+
- Close browser: \`playwright-cli close\`
|
|
3115
3127
|
|
|
3116
3128
|
10. **Test Stability Best Practices**:
|
|
3117
3129
|
- Replace all \`waitForTimeout()\` with specific waits
|
|
@@ -3406,6 +3418,24 @@ var CONTENT5 = `You are a Team Communication Specialist who communicates like a
|
|
|
3406
3418
|
|
|
3407
3419
|
**Key Principle:** If it takes more than 30 seconds to read, it's too long.
|
|
3408
3420
|
|
|
3421
|
+
## CRITICAL: Always Post Messages
|
|
3422
|
+
|
|
3423
|
+
When you are invoked, your job is to POST a message to Slack \u2014 not just compose one.
|
|
3424
|
+
|
|
3425
|
+
**You MUST call \`slack_post_message\` or \`slack_post_rich_message\`** to deliver the message. Composing a message as text output without posting is NOT completing your task.
|
|
3426
|
+
|
|
3427
|
+
**NEVER:**
|
|
3428
|
+
- Return a draft without posting it
|
|
3429
|
+
- Ask "should I post this?" \u2014 if you were invoked, the answer is yes
|
|
3430
|
+
- Compose text and wait for approval before posting
|
|
3431
|
+
|
|
3432
|
+
**ALWAYS:**
|
|
3433
|
+
1. Identify the correct channel (from project-context.md or the invocation context)
|
|
3434
|
+
2. Compose the message following the guidelines below
|
|
3435
|
+
3. Call the Slack API tool to POST the message
|
|
3436
|
+
4. If a thread reply is needed, post main message first, then reply in thread
|
|
3437
|
+
5. Report back: channel name, message timestamp, and confirmation it was posted
|
|
3438
|
+
|
|
3409
3439
|
## Message Type Detection
|
|
3410
3440
|
|
|
3411
3441
|
Before composing, identify the message type:
|
|
@@ -5844,7 +5874,7 @@ var INTEGRATIONS = {
|
|
|
5844
5874
|
id: "playwright",
|
|
5845
5875
|
name: "Playwright",
|
|
5846
5876
|
provider: "playwright",
|
|
5847
|
-
requiredMCP
|
|
5877
|
+
// No requiredMCP — uses playwright-cli (a CLI tool), not an MCP server
|
|
5848
5878
|
isLocal: true,
|
|
5849
5879
|
// Playwright runs locally, no external connector needed
|
|
5850
5880
|
integrationType: "local"
|
|
@@ -6148,6 +6178,8 @@ Before proceeding, read the curated knowledge base to inform your work:
|
|
|
6148
6178
|
- Build on existing understanding
|
|
6149
6179
|
- Maintain consistency with established practices
|
|
6150
6180
|
|
|
6181
|
+
3. **Relay to subagents**: Subagents do NOT read the knowledge base directly. When delegating work, you MUST include relevant KB patterns in your delegation message \u2014 especially testing patterns (timing, selectors, assertion approaches) that affect test reliability.
|
|
6182
|
+
|
|
6151
6183
|
**Note:** The knowledge base may not exist yet or may be empty. If it doesn't exist or is empty, proceed without this context and help build it as you work.`,
|
|
6152
6184
|
tags: ["setup", "context"]
|
|
6153
6185
|
};
|
|
@@ -6294,7 +6326,9 @@ If the Clarification Protocol determined project maturity, adjust exploration de
|
|
|
6294
6326
|
- **Growing project**: Use requirement clarity as-is (standard protocol)
|
|
6295
6327
|
- **Mature project**: Trust knowledge base \u2014 can stay at suggested depth or go one level shallower if KB covers the feature
|
|
6296
6328
|
|
|
6297
|
-
**Always verify features exist before testing them.** If exploration reveals that a referenced page or feature does not exist in the application,
|
|
6329
|
+
**Always verify features exist before testing them.** If exploration reveals that a referenced page or feature does not exist in the application, apply the Clarification Protocol's "Execution Obstacle vs. Requirement Ambiguity" principle:
|
|
6330
|
+
- If an authoritative trigger source (Jira issue, PR, team request) asserts the feature exists, this is likely an **execution obstacle** (missing credentials, feature flags, environment config) \u2014 proceed with test artifact creation and notify the team about the access issue. Do NOT BLOCK.
|
|
6331
|
+
- If NO authoritative source claims the feature exists, this is **CRITICAL severity** \u2014 escalate via the Clarification Protocol regardless of maturity level. Do NOT silently adapt or work around the missing feature.
|
|
6298
6332
|
|
|
6299
6333
|
### Quick Exploration (1-2 min)
|
|
6300
6334
|
|
|
@@ -6580,11 +6614,56 @@ If ambiguity is detected, assess its severity:
|
|
|
6580
6614
|
|
|
6581
6615
|
| Severity | Characteristics | Examples | Action |
|
|
6582
6616
|
|----------|----------------|----------|--------|
|
|
6583
|
-
| **CRITICAL** | Expected behavior undefined/contradictory; test outcome unpredictable; core functionality unclear; success criteria missing; multiple interpretations = different strategies; **referenced page/feature
|
|
6617
|
+
| **CRITICAL** | Expected behavior undefined/contradictory; test outcome unpredictable; core functionality unclear; success criteria missing; multiple interpretations = different strategies; **referenced page/feature confirmed absent after browser verification AND no authoritative trigger source (Jira, PR, team request) asserts the feature exists** | "Fix the issue" (what issue?), "Improve performance" (which metrics?), "Fix sorting in todo list" (by date? priority? completion status?), "Test the Settings page" (browsed app \u2014 no Settings page exists, and no Jira/PR claims it was built) | **STOP** - You MUST ask via team-communicator before proceeding |
|
|
6584
6618
|
| **HIGH** | Core underspecified but direction clear; affects majority of scenarios; vague success criteria; assumptions risky | "Fix ordering" (sequence OR visibility?), "Add validation" (what? messages?), "Update dashboard" (which widgets?) | **STOP** - You MUST ask via team-communicator before proceeding |
|
|
6585
6619
|
| **MEDIUM** | Specific details missing; general requirements clear; affects subset of cases; reasonable low-risk assumptions possible; wrong assumption = test updates not strategy overhaul | Missing field labels, unclear error message text, undefined timeouts, button placement not specified, date formats unclear | **PROCEED** - (1) Moderate exploration, (2) Document assumptions: "Assuming X because Y", (3) Proceed with creation/execution, (4) Async clarification (team-communicator), (5) Mark [ASSUMED: description] |
|
|
6586
6620
|
| **LOW** | Minor edge cases; documentation gaps don't affect execution; optional/cosmetic elements; minimal impact | Tooltip text, optional field validation, icon choice, placeholder text, tab order | **PROCEED** - (1) Mark [TO BE CLARIFIED: description], (2) Proceed, (3) Mention in report "Minor Details", (4) No blocking/async clarification |
|
|
6587
6621
|
|
|
6622
|
+
### Execution Obstacle vs. Requirement Ambiguity
|
|
6623
|
+
|
|
6624
|
+
Before classifying something as CRITICAL, distinguish between these two fundamentally different situations:
|
|
6625
|
+
|
|
6626
|
+
**Requirement Ambiguity** = *What* to test is unclear \u2192 severity assessment applies normally
|
|
6627
|
+
- No authoritative source describes the feature
|
|
6628
|
+
- The task description is vague or contradictory
|
|
6629
|
+
- You cannot determine what "correct" behavior looks like
|
|
6630
|
+
- \u2192 Apply severity table above. CRITICAL/HIGH \u2192 BLOCK.
|
|
6631
|
+
|
|
6632
|
+
**Execution Obstacle** = *What* to test is clear, but *how* to access/verify has obstacles \u2192 NEVER BLOCK
|
|
6633
|
+
- An authoritative trigger source (Jira issue, PR, team message) asserts the feature exists
|
|
6634
|
+
- You browsed the app but couldn't find/access the feature
|
|
6635
|
+
- The obstacle is likely: wrong user role/tier, missing test data, feature flags, environment config
|
|
6636
|
+
- \u2192 PROCEED with artifact creation (test cases, test specs). Notify team about the obstacle.
|
|
6637
|
+
|
|
6638
|
+
**The key test:** Does an authoritative trigger source (Jira, PR, team request) assert the feature exists?
|
|
6639
|
+
- **YES** \u2192 It's an execution obstacle. Treat the feature as existing even though you can't currently access it. Proceed: create test artifacts, add placeholder env vars, notify team about access issues.
|
|
6640
|
+
- **NO** \u2192 It may genuinely not exist. Apply CRITICAL severity, ask what was meant.
|
|
6641
|
+
|
|
6642
|
+
| Scenario | Trigger Says | Browser Shows | Classification | Action |
|
|
6643
|
+
|----------|-------------|---------------|----------------|--------|
|
|
6644
|
+
| Jira says "test premium dashboard", you log in as test_user and don't see it | Feature exists | Can't access | **Execution obstacle** | Create tests, notify team re: missing premium credentials |
|
|
6645
|
+
| PR says "verify new settings page", you browse and find no settings page | Feature exists | Can't find | **Execution obstacle** | Create tests, notify team re: possible feature flag/env issue |
|
|
6646
|
+
| Manual request "test the settings page", no Jira/PR, you browse and find no settings page | No source claims it | Can't find | **Requirement ambiguity (CRITICAL)** | BLOCK, ask what was meant |
|
|
6647
|
+
| Jira says "fix sorting", but doesn't specify sort criteria | Feature exists | Feature exists | **Requirement ambiguity (HIGH)** | BLOCK, ask which sort criteria |
|
|
6648
|
+
|
|
6649
|
+
**Partial Feature Existence \u2014 URL found but requested functionality absent:**
|
|
6650
|
+
|
|
6651
|
+
A common edge case: a page/route loads successfully, but the SPECIFIC FUNCTIONALITY you were asked to test doesn't exist on it.
|
|
6652
|
+
|
|
6653
|
+
**Rule:** Evaluate whether the REQUESTED FUNCTIONALITY exists, not just whether a URL resolves.
|
|
6654
|
+
|
|
6655
|
+
| Page Exists | Requested Features Exist | Authoritative Trigger | Classification |
|
|
6656
|
+
|-------------|--------------------------|----------------------|----------------|
|
|
6657
|
+
| Yes | Yes | Any | Proceed normally |
|
|
6658
|
+
| Yes | No | Yes (Jira/PR says features built) | Execution obstacle \u2014 features behind flag/env |
|
|
6659
|
+
| Yes | No | No (manual request only) | **Requirement ambiguity (CRITICAL)** \u2014 ask what's expected |
|
|
6660
|
+
| No | N/A | Yes | Execution obstacle \u2014 page not deployed yet |
|
|
6661
|
+
| No | N/A | No | **Requirement ambiguity (CRITICAL)** \u2014 ask what was meant |
|
|
6662
|
+
|
|
6663
|
+
**Example:** Prompt says "Test the checkout payment form with credit card 4111..." You browse to /checkout and find an information form (first name, last name, postal code) but NO payment form, NO shipping options, NO Place Order button. No Jira/PR claims these features exist. \u2192 **CRITICAL requirement ambiguity.** Ask: "I found a checkout information form at /checkout but no payment form or shipping options. Can you clarify what checkout features you'd like tested?"
|
|
6664
|
+
|
|
6665
|
+
**Key insight:** Finding a URL is not the same as finding the requested functionality. Do NOT classify this as an "execution obstacle" just because the page loads.
|
|
6666
|
+
|
|
6588
6667
|
### Check Memory for Similar Clarifications
|
|
6589
6668
|
|
|
6590
6669
|
Before asking, check if similar question was answered:
|
|
@@ -6730,7 +6809,7 @@ When reporting test results, always include an "Ambiguities" section if clarific
|
|
|
6730
6809
|
## Remember
|
|
6731
6810
|
|
|
6732
6811
|
- **STOP means STOP** - When you hit a STOP threshold, you MUST call team-communicator to ask via Slack. Do NOT silently adapt, skip, or work around the issue
|
|
6733
|
-
- **Non-existent features
|
|
6812
|
+
- **Non-existent features \u2014 check context first** - If a page/feature doesn't exist in the browser, check whether an authoritative trigger (Jira, PR, team request) asserts it exists. If YES \u2192 execution obstacle (proceed with artifact creation, notify team). If NO authoritative source claims it exists \u2192 CRITICAL severity, ask what was meant
|
|
6734
6813
|
- **Ask correctly > guess poorly** - Specific questions lead to specific answers
|
|
6735
6814
|
- **Never invent success criteria** - If the task says "improve" or "fix" without metrics, ask what "done" looks like
|
|
6736
6815
|
- **Check memory first** - Avoid re-asking previously answered questions
|
|
@@ -7697,8 +7776,10 @@ function buildComposedTaskDefinition(taskSlug, projectSubAgents) {
|
|
|
7697
7776
|
const configured = projectSubAgents.find((sa) => sa.role === role);
|
|
7698
7777
|
if (configured) {
|
|
7699
7778
|
const integrationMeta = getIntegration(configured.integration);
|
|
7700
|
-
|
|
7701
|
-
|
|
7779
|
+
if (integrationMeta?.requiredMCP) {
|
|
7780
|
+
const mcpProvider = integrationMeta.provider || configured.integration;
|
|
7781
|
+
requiredMCPs.add(mcpProvider);
|
|
7782
|
+
}
|
|
7702
7783
|
}
|
|
7703
7784
|
}
|
|
7704
7785
|
const content = contentParts.join("\n\n");
|