npm - @yasserkhanorg/e2e-agents - Versions diffs - 1.8.3 → 1.8.5 - Mend

@yasserkhanorg/e2e-agents 1.8.3 → 1.8.5

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (4)

package/dist/cli/commands/plan_crew.d.ts.map +1 -1
package/dist/cli/commands/plan_crew.js +111 -68
package/dist/esm/cli/commands/plan_crew.js +111 -68
package/package.json +1 -1

package/dist/cli/commands/plan_crew.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"plan_crew.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/plan_crew.ts"],"names":[],"mappings":"AAMA,OAAO,KAAK,EAAC,WAAW,EAAC,MAAM,uBAAuB,CAAC;AACvD,OAAO,KAAK,EAAC,gBAAgB,EAAE,UAAU,EAAC,MAAM,qBAAqB,CAAC;AAUtE,OAAO,KAAK,EAAC,UAAU,EAAC,MAAM,aAAa,CAAC;AAgC5C,wBAAsB,mBAAmB,CAAC,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,WAAW,EAAE,IAAI,EAAE,UAAU,GAAG,OAAO,CAAC,gBAAgB,CAAC,CAkD5H;~~AAED~~,wBAAgB,iBAAiB,CAAC,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,~~CAuEnF~~;AAED,wBAAgB,mBAAmB,CAAC,YAAY,EAAE,MAAM,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,CAE3G;AAED;;;GAGG;AACH,wBAAgB,iBAAiB,CAAC,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,~~CAuHnF~~;AAED,wBAAgB,kBAAkB,CAAC,UAAU,EAAE,MAAM,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG;IAAC,eAAe,EAAE,MAAM,CAAC;IAAC,gBAAgB,EAAE,MAAM,CAAC;IAAC,gBAAgB,EAAE,MAAM,CAAA;CAAC,CAa/K"}
1	+ {"version":3,"file":"plan_crew.d.ts","sourceRoot":"","sources":["../../../src/cli/commands/plan_crew.ts"],"names":[],"mappings":"AAMA,OAAO,KAAK,EAAC,WAAW,EAAC,MAAM,uBAAuB,CAAC;AACvD,OAAO,KAAK,EAAC,gBAAgB,EAAE,UAAU,EAAC,MAAM,qBAAqB,CAAC;AAUtE,OAAO,KAAK,EAAC,UAAU,EAAC,MAAM,aAAa,CAAC;AAgC5C,wBAAsB,mBAAmB,CAAC,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,WAAW,EAAE,IAAI,EAAE,UAAU,GAAG,OAAO,CAAC,gBAAgB,CAAC,CAkD5H;AAWD,wBAAgB,iBAAiB,CAAC,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,CAwEnF;AAED,wBAAgB,mBAAmB,CAAC,YAAY,EAAE,MAAM,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,CAE3G;AAED;;;GAGG;AACH,wBAAgB,iBAAiB,CAAC,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG,MAAM,CAsJnF;AAED,wBAAgB,kBAAkB,CAAC,UAAU,EAAE,MAAM,EAAE,IAAI,EAAE,gBAAgB,EAAE,IAAI,CAAC,EAAE,UAAU,GAAG;IAAC,eAAe,EAAE,MAAM,CAAC;IAAC,gBAAgB,EAAE,MAAM,CAAC;IAAC,gBAAgB,EAAE,MAAM,CAAA;CAAC,CAa/K"}

package/dist/cli/commands/plan_crew.js CHANGED Viewed

@@ -85,25 +85,37 @@ async function runPlanCrewAnalysis(plan, config, args) {
         timings: result.timings,
     };
 }
+/**
+ * Match a strategy/design entry against a set of gap family IDs.
+ */
+function matchesGapFamily(flowId, flowName, gapFamilies) {
+    return Array.from(gapFamilies).some((fam) => flowId.startsWith(fam) || flowName.toLowerCase().includes(fam.replace(/_/g, ' ')));
+}
 function buildCrewMarkdown(crew, plan) {
     const totalCases = crew.testDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const gapFamilies = new Set((plan?.gapDetails ?? []).map((g) => g.id));
-    const gapDesigns = gapFamilies.size > 0
-        ? crew.testDesigns.filter((td) => Array.from(gapFamilies).some((fam) => td.flowId.startsWith(fam) || td.flowName.toLowerCase().includes(fam.replace(/_/g, ' '))))
-        : [];
-    const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
-    const gapP0Cases = gapDesigns.reduce((n, td) => n + td.testCases.filter((tc) => tc.priority === 'P0').length, 0);
     const lines = [
-        '### Crew Insights',
+        '### Crew Analysis — What to Test',
+        '',
+        `Crew analyzed the diff and recommends what to verify before merging.`,
         '',
-        `Workflow: \`${crew.workflow}\``,
-        `Impacted flows: **${crew.summary.impactedFlows}**`,
-        `Structured test designs: **${crew.summary.testDesigns}** flows, **${totalCases}** test cases`,
+        `Impacted flows: **${crew.summary.impactedFlows}** | Strategy entries: **${crew.summary.strategyEntries}**`,
     ];
-    if (gapFamilies.size > 0 && gapDesigns.length > 0) {
-        lines.push(`Gap-focused: **${gapDesigns.length}** flows, **${gapCases}** test cases (**${gapP0Cases}** P0)`);
+    if (totalCases > 0) {
+        const gapDesigns = gapFamilies.size > 0
+            ? crew.testDesigns.filter((td) => matchesGapFamily(td.flowId, td.flowName, gapFamilies))
+            : [];
+        const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
+        const gapP0Cases = gapDesigns.reduce((n, td) => n + td.testCases.filter((tc) => tc.priority === 'P0').length, 0);
+        lines.push(`Structured test designs: **${crew.summary.testDesigns}** flows, **${totalCases}** test cases`);
+        if (gapDesigns.length > 0) {
+            lines.push(`Gap-focused: **${gapDesigns.length}** flows, **${gapCases}** test cases (**${gapP0Cases}** P0)`);
+        }
+    }
+    if (crew.summary.crossImpacts > 0) {
+        lines.push(`Cross-impacts: **${crew.summary.crossImpacts}** (${crew.summary.highRiskCrossImpacts} high risk)`);
     }
-    lines.push(`Cross-impacts: **${crew.summary.crossImpacts}** (${crew.summary.highRiskCrossImpacts} high risk)`, `Estimated AI cost: **$${crew.summary.totalCostUSD.toFixed(4)}**`);
+    lines.push(`Estimated AI cost: **$${crew.summary.totalCostUSD.toFixed(4)}**`);
     if (crew.strategyEntries.length > 0) {
         lines.push('');
         lines.push('Top Strategy Recommendations:');
@@ -151,14 +163,18 @@ function appendCrewToSummary(baseMarkdown, crew, plan) {
  */
 function buildCrewTestPlan(crew, plan) {
     const gapFamilies = new Set((plan?.gapDetails ?? []).map((g) => g.id));
+    const hasTestDesigns = crew.testDesigns.length > 0;
     const totalCases = crew.testDesigns.reduce((n, td) => n + td.testCases.length, 0);
-    // Split designs into gap-related and coverage-expansion
+    // Split strategy entries into gap-related and covered
+    const gapStrategies = gapFamilies.size > 0
+        ? crew.strategyEntries.filter((s) => matchesGapFamily(s.flowId, s.flowName, gapFamilies))
+        : [];
+    const coveredStrategies = crew.strategyEntries.filter((s) => !gapStrategies.includes(s));
+    // Split test designs (if present) into gap-related and covered
     const gapDesigns = [];
     const coveredDesigns = [];
     for (const td of crew.testDesigns) {
-        // Match by flowId prefix against gap family ids
-        const isGap = Array.from(gapFamilies).some((fam) => td.flowId.startsWith(fam) || td.flowName.toLowerCase().includes(fam.replace(/_/g, ' ')));
-        if (isGap) {
+        if (matchesGapFamily(td.flowId, td.flowName, gapFamilies)) {
             gapDesigns.push(td);
         }
         else {
@@ -168,90 +184,117 @@ function buildCrewTestPlan(crew, plan) {
     const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const coveredCases = coveredDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const lines = [
-        '# Crew Test Plan',
+        '# Crew Test Plan — What to Verify',
         '',
-        `> Auto-generated by e2e-agents crew (\`${crew.workflow}\` workflow)`,
+        '> **This is a test recommendation, not a test execution report.**',
+        '> Crew analyzed the code diff and identified what needs to be tested.',
+        '> Use this plan to guide manual QA or write automated E2E tests.',
+        '',
+        `_Auto-generated by e2e-agents crew (\`${crew.workflow}\` workflow)_`,
         '',
         '## Summary',
         '',
         `| Metric | Count |`,
         `|--------|-------|`,
-        `| Gap flows (missing tests) | ${gapDesigns.length} flows, **${gapCases} test cases** |`,
-        `| Covered flows (expansion) | ${coveredDesigns.length} flows, ${coveredCases} test cases |`,
-        `| Total | ${crew.testDesigns.length} flows, ${totalCases} test cases |`,
+        `| Gap flows — **no existing tests, must verify** | ${gapStrategies.length} flows${hasTestDesigns ? `, **${gapCases} test cases**` : ''} |`,
+        `| Covered flows — **has tests, verify no regressions** | ${coveredStrategies.length} flows${hasTestDesigns ? `, ${coveredCases} test cases` : ''} |`,
+        `| Total | ${crew.strategyEntries.length} flows${hasTestDesigns ? `, ${totalCases} test cases` : ''} |`,
         `| High-risk cross-impacts | ${crew.summary.highRiskCrossImpacts} |`,
         `| AI cost | $${crew.summary.totalCostUSD.toFixed(4)} |`,
         '',
     ];
-    // Priority action items
-    if (gapDesigns.length > 0) {
-        lines.push('## Priority: Gap Flows (Missing Tests)');
+    // ── Gap flows ──
+    if (gapStrategies.length > 0) {
+        lines.push('## Action Required: Gap Flows (No Existing Tests)');
         lines.push('');
-        lines.push('These flows have **no existing E2E coverage** and should be addressed first.');
+        lines.push('These flows have **no automated E2E coverage**. Before merging, either:');
+        lines.push('1. **Write E2E tests** for the critical scenarios below, or');
+        lines.push('2. **Manually verify** each flow works as expected');
         lines.push('');
-        for (const td of gapDesigns) {
-            const strategy = crew.strategyEntries.find((s) => s.flowId === td.flowId);
-            const approach = strategy?.approach ?? 'full-test';
-            const risk = strategy?.crossImpactRisk ?? 'unknown';
-            const p0Cases = td.testCases.filter((tc) => tc.priority === 'P0');
-            const p1Cases = td.testCases.filter((tc) => tc.priority === 'P1');
-            lines.push(`### ${td.flowName}`);
+        for (const strategy of gapStrategies) {
+            const td = crew.testDesigns.find((d) => d.flowId === strategy.flowId);
+            lines.push(`### ${strategy.flowName}`);
             lines.push('');
-            lines.push(`Strategy: **${approach}** | Cross-impact risk: **${risk}** | ${td.testCases.length} cases (${p0Cases.length} P0, ${p1Cases.length} P1)`);
+            const actionVerb = strategy.approach === 'full-test' ? 'Write full E2E test or verify manually'
+                : strategy.approach === 'smoke-test' ? 'Smoke-test manually or add basic E2E coverage'
+                    : strategy.approach === 'manual-review' ? 'Manual review required'
+                        : 'Can skip — low risk';
+            lines.push(`**${strategy.priority}** | Recommended: **${strategy.approach}** | Cross-impact risk: **${strategy.crossImpactRisk}**`);
+            lines.push(`> ${actionVerb}`);
+            if (strategy.rationale && !strategy.rationale.includes('Default strategy')) {
+                lines.push(`> Rationale: ${strategy.rationale}`);
+            }
+            if (strategy.testCategories.length > 0) {
+                lines.push(`> Test types to cover: ${strategy.testCategories.join(', ')}`);
+            }
             lines.push('');
-            // Show P0 cases expanded
-            if (p0Cases.length > 0) {
-                lines.push('**P0 — Must test:**');
-                lines.push('');
-                for (const tc of p0Cases) {
-                    lines.push(`- [ ] **${tc.name}** (${tc.type})`);
-                    if (tc.preconditions.length > 0) {
-                        lines.push(`  - Preconditions: ${tc.preconditions.join('; ')}`);
+            // If test designs exist, show P0/P1 cases
+            if (td && td.testCases.length > 0) {
+                const p0Cases = td.testCases.filter((tc) => tc.priority === 'P0');
+                const p1Cases = td.testCases.filter((tc) => tc.priority === 'P1');
+                if (p0Cases.length > 0) {
+                    lines.push('**P0 — Must test:**');
+                    lines.push('');
+                    for (const tc of p0Cases) {
+                        lines.push(`- [ ] **${tc.name}** (${tc.type})`);
+                        if (tc.preconditions.length > 0) {
+                            lines.push(`  - Preconditions: ${tc.preconditions.join('; ')}`);
+                        }
+                        lines.push(`  - Steps: ${tc.steps.join(' → ')}`);
+                        lines.push(`  - Expected: ${tc.expectedOutcome}`);
                     }
-                    lines.push(`  - Steps: ${tc.steps.join(' → ')}`);
-                    lines.push(`  - Expected: ${tc.expectedOutcome}`);
+                    lines.push('');
                 }
-                lines.push('');
-            }
-            // Show P1 as a collapsed checklist
-            if (p1Cases.length > 0) {
-                lines.push(`<details><summary>P1 — Should test (${p1Cases.length})</summary>`);
-                lines.push('');
-                for (const tc of p1Cases) {
-                    lines.push(`- [ ] **${tc.name}** (${tc.type}) — ${tc.expectedOutcome}`);
+                if (p1Cases.length > 0) {
+                    lines.push(`<details><summary>P1 — Should test (${p1Cases.length})</summary>`);
+                    lines.push('');
+                    for (const tc of p1Cases) {
+                        lines.push(`- [ ] **${tc.name}** (${tc.type}) — ${tc.expectedOutcome}`);
+                    }
+                    lines.push('');
+                    lines.push('</details>');
+                    lines.push('');
                 }
-                lines.push('');
-                lines.push('</details>');
-                lines.push('');
             }
         }
     }
-    // Covered flow expansion — collapsed by default
-    if (coveredDesigns.length > 0) {
-        lines.push('## Covered Flows (Regression / Expansion)');
+    // ── Covered flows ──
+    if (coveredStrategies.length > 0) {
+        lines.push('## Regression Check: Covered Flows (Already Have Tests)');
         lines.push('');
-        lines.push('These flows already have specs. The test cases below extend coverage for changes in this PR.');
+        lines.push('These flows have existing E2E specs. The existing tests should catch regressions automatically.');
+        lines.push('**No manual action required** unless CI tests fail on these flows.');
         lines.push('');
-        for (const td of coveredDesigns) {
-            const strategy = crew.strategyEntries.find((s) => s.flowId === td.flowId);
-            const approach = strategy?.approach ?? 'smoke-test';
-            const p0Count = td.testCases.filter((tc) => tc.priority === 'P0').length;
-            lines.push(`<details><summary><strong>${td.flowName}</strong> — ${approach} | ${td.testCases.length} cases (${p0Count} P0)</summary>`);
+        for (const strategy of coveredStrategies) {
+            const td = crew.testDesigns.find((d) => d.flowId === strategy.flowId);
+            const caseCount = td ? td.testCases.length : 0;
+            const detail = caseCount > 0 ? ` | ${caseCount} cases` : '';
+            lines.push(`<details><summary><strong>${strategy.flowName}</strong> — ${strategy.approach}${detail} (${strategy.priority})</summary>`);
             lines.push('');
-            for (const tc of td.testCases) {
-                lines.push(`- [ ] **${tc.name}** (${tc.priority}, ${tc.type}) — ${tc.expectedOutcome}`);
+            lines.push(`Existing tests should cover this. Cross-impact risk: ${strategy.crossImpactRisk}`);
+            if (strategy.rationale && !strategy.rationale.includes('Default strategy')) {
+                lines.push(`> ${strategy.rationale}`);
+            }
+            if (strategy.testCategories.length > 0) {
+                lines.push(`Test categories: ${strategy.testCategories.join(', ')}`);
+            }
+            if (td && td.testCases.length > 0) {
+                lines.push('');
+                for (const tc of td.testCases) {
+                    lines.push(`- [ ] **${tc.name}** (${tc.priority}, ${tc.type}) — ${tc.expectedOutcome}`);
+                }
             }
             lines.push('');
             lines.push('</details>');
             lines.push('');
         }
     }
-    // Cross-impacts section
+    // ── Cross-impacts ──
     const highRisk = crew.crossImpacts.filter((ci) => ci.riskLevel === 'high');
     if (highRisk.length > 0) {
-        lines.push('## High-Risk Cross-Impacts');
+        lines.push('## High-Risk Cross-Impacts — Verify Before Release');
         lines.push('');
-        lines.push('These cross-family dependencies should be verified during release testing:');
+        lines.push('Changes in one area may break these related areas. Manually verify or ensure E2E tests cover both sides:');
         lines.push('');
         for (const ci of highRisk) {
             lines.push(`- **${ci.sourceFamily}** → **${ci.affectedFamily}**: ${ci.sharedDependency}`);

package/dist/esm/cli/commands/plan_crew.js CHANGED Viewed

@@ -78,25 +78,37 @@ export async function runPlanCrewAnalysis(plan, config, args) {
         timings: result.timings,
     };
 }
+/**
+ * Match a strategy/design entry against a set of gap family IDs.
+ */
+function matchesGapFamily(flowId, flowName, gapFamilies) {
+    return Array.from(gapFamilies).some((fam) => flowId.startsWith(fam) || flowName.toLowerCase().includes(fam.replace(/_/g, ' ')));
+}
 export function buildCrewMarkdown(crew, plan) {
     const totalCases = crew.testDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const gapFamilies = new Set((plan?.gapDetails ?? []).map((g) => g.id));
-    const gapDesigns = gapFamilies.size > 0
-        ? crew.testDesigns.filter((td) => Array.from(gapFamilies).some((fam) => td.flowId.startsWith(fam) || td.flowName.toLowerCase().includes(fam.replace(/_/g, ' '))))
-        : [];
-    const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
-    const gapP0Cases = gapDesigns.reduce((n, td) => n + td.testCases.filter((tc) => tc.priority === 'P0').length, 0);
     const lines = [
-        '### Crew Insights',
+        '### Crew Analysis — What to Test',
+        '',
+        `Crew analyzed the diff and recommends what to verify before merging.`,
         '',
-        `Workflow: \`${crew.workflow}\``,
-        `Impacted flows: **${crew.summary.impactedFlows}**`,
-        `Structured test designs: **${crew.summary.testDesigns}** flows, **${totalCases}** test cases`,
+        `Impacted flows: **${crew.summary.impactedFlows}** | Strategy entries: **${crew.summary.strategyEntries}**`,
     ];
-    if (gapFamilies.size > 0 && gapDesigns.length > 0) {
-        lines.push(`Gap-focused: **${gapDesigns.length}** flows, **${gapCases}** test cases (**${gapP0Cases}** P0)`);
+    if (totalCases > 0) {
+        const gapDesigns = gapFamilies.size > 0
+            ? crew.testDesigns.filter((td) => matchesGapFamily(td.flowId, td.flowName, gapFamilies))
+            : [];
+        const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
+        const gapP0Cases = gapDesigns.reduce((n, td) => n + td.testCases.filter((tc) => tc.priority === 'P0').length, 0);
+        lines.push(`Structured test designs: **${crew.summary.testDesigns}** flows, **${totalCases}** test cases`);
+        if (gapDesigns.length > 0) {
+            lines.push(`Gap-focused: **${gapDesigns.length}** flows, **${gapCases}** test cases (**${gapP0Cases}** P0)`);
+        }
+    }
+    if (crew.summary.crossImpacts > 0) {
+        lines.push(`Cross-impacts: **${crew.summary.crossImpacts}** (${crew.summary.highRiskCrossImpacts} high risk)`);
     }
-    lines.push(`Cross-impacts: **${crew.summary.crossImpacts}** (${crew.summary.highRiskCrossImpacts} high risk)`, `Estimated AI cost: **$${crew.summary.totalCostUSD.toFixed(4)}**`);
+    lines.push(`Estimated AI cost: **$${crew.summary.totalCostUSD.toFixed(4)}**`);
     if (crew.strategyEntries.length > 0) {
         lines.push('');
         lines.push('Top Strategy Recommendations:');
@@ -144,14 +156,18 @@ export function appendCrewToSummary(baseMarkdown, crew, plan) {
  */
 export function buildCrewTestPlan(crew, plan) {
     const gapFamilies = new Set((plan?.gapDetails ?? []).map((g) => g.id));
+    const hasTestDesigns = crew.testDesigns.length > 0;
     const totalCases = crew.testDesigns.reduce((n, td) => n + td.testCases.length, 0);
-    // Split designs into gap-related and coverage-expansion
+    // Split strategy entries into gap-related and covered
+    const gapStrategies = gapFamilies.size > 0
+        ? crew.strategyEntries.filter((s) => matchesGapFamily(s.flowId, s.flowName, gapFamilies))
+        : [];
+    const coveredStrategies = crew.strategyEntries.filter((s) => !gapStrategies.includes(s));
+    // Split test designs (if present) into gap-related and covered
     const gapDesigns = [];
     const coveredDesigns = [];
     for (const td of crew.testDesigns) {
-        // Match by flowId prefix against gap family ids
-        const isGap = Array.from(gapFamilies).some((fam) => td.flowId.startsWith(fam) || td.flowName.toLowerCase().includes(fam.replace(/_/g, ' ')));
-        if (isGap) {
+        if (matchesGapFamily(td.flowId, td.flowName, gapFamilies)) {
             gapDesigns.push(td);
         }
         else {
@@ -161,90 +177,117 @@ export function buildCrewTestPlan(crew, plan) {
     const gapCases = gapDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const coveredCases = coveredDesigns.reduce((n, td) => n + td.testCases.length, 0);
     const lines = [
-        '# Crew Test Plan',
+        '# Crew Test Plan — What to Verify',
         '',
-        `> Auto-generated by e2e-agents crew (\`${crew.workflow}\` workflow)`,
+        '> **This is a test recommendation, not a test execution report.**',
+        '> Crew analyzed the code diff and identified what needs to be tested.',
+        '> Use this plan to guide manual QA or write automated E2E tests.',
+        '',
+        `_Auto-generated by e2e-agents crew (\`${crew.workflow}\` workflow)_`,
         '',
         '## Summary',
         '',
         `| Metric | Count |`,
         `|--------|-------|`,
-        `| Gap flows (missing tests) | ${gapDesigns.length} flows, **${gapCases} test cases** |`,
-        `| Covered flows (expansion) | ${coveredDesigns.length} flows, ${coveredCases} test cases |`,
-        `| Total | ${crew.testDesigns.length} flows, ${totalCases} test cases |`,
+        `| Gap flows — **no existing tests, must verify** | ${gapStrategies.length} flows${hasTestDesigns ? `, **${gapCases} test cases**` : ''} |`,
+        `| Covered flows — **has tests, verify no regressions** | ${coveredStrategies.length} flows${hasTestDesigns ? `, ${coveredCases} test cases` : ''} |`,
+        `| Total | ${crew.strategyEntries.length} flows${hasTestDesigns ? `, ${totalCases} test cases` : ''} |`,
         `| High-risk cross-impacts | ${crew.summary.highRiskCrossImpacts} |`,
         `| AI cost | $${crew.summary.totalCostUSD.toFixed(4)} |`,
         '',
     ];
-    // Priority action items
-    if (gapDesigns.length > 0) {
-        lines.push('## Priority: Gap Flows (Missing Tests)');
+    // ── Gap flows ──
+    if (gapStrategies.length > 0) {
+        lines.push('## Action Required: Gap Flows (No Existing Tests)');
         lines.push('');
-        lines.push('These flows have **no existing E2E coverage** and should be addressed first.');
+        lines.push('These flows have **no automated E2E coverage**. Before merging, either:');
+        lines.push('1. **Write E2E tests** for the critical scenarios below, or');
+        lines.push('2. **Manually verify** each flow works as expected');
         lines.push('');
-        for (const td of gapDesigns) {
-            const strategy = crew.strategyEntries.find((s) => s.flowId === td.flowId);
-            const approach = strategy?.approach ?? 'full-test';
-            const risk = strategy?.crossImpactRisk ?? 'unknown';
-            const p0Cases = td.testCases.filter((tc) => tc.priority === 'P0');
-            const p1Cases = td.testCases.filter((tc) => tc.priority === 'P1');
-            lines.push(`### ${td.flowName}`);
+        for (const strategy of gapStrategies) {
+            const td = crew.testDesigns.find((d) => d.flowId === strategy.flowId);
+            lines.push(`### ${strategy.flowName}`);
             lines.push('');
-            lines.push(`Strategy: **${approach}** | Cross-impact risk: **${risk}** | ${td.testCases.length} cases (${p0Cases.length} P0, ${p1Cases.length} P1)`);
+            const actionVerb = strategy.approach === 'full-test' ? 'Write full E2E test or verify manually'
+                : strategy.approach === 'smoke-test' ? 'Smoke-test manually or add basic E2E coverage'
+                    : strategy.approach === 'manual-review' ? 'Manual review required'
+                        : 'Can skip — low risk';
+            lines.push(`**${strategy.priority}** | Recommended: **${strategy.approach}** | Cross-impact risk: **${strategy.crossImpactRisk}**`);
+            lines.push(`> ${actionVerb}`);
+            if (strategy.rationale && !strategy.rationale.includes('Default strategy')) {
+                lines.push(`> Rationale: ${strategy.rationale}`);
+            }
+            if (strategy.testCategories.length > 0) {
+                lines.push(`> Test types to cover: ${strategy.testCategories.join(', ')}`);
+            }
             lines.push('');
-            // Show P0 cases expanded
-            if (p0Cases.length > 0) {
-                lines.push('**P0 — Must test:**');
-                lines.push('');
-                for (const tc of p0Cases) {
-                    lines.push(`- [ ] **${tc.name}** (${tc.type})`);
-                    if (tc.preconditions.length > 0) {
-                        lines.push(`  - Preconditions: ${tc.preconditions.join('; ')}`);
+            // If test designs exist, show P0/P1 cases
+            if (td && td.testCases.length > 0) {
+                const p0Cases = td.testCases.filter((tc) => tc.priority === 'P0');
+                const p1Cases = td.testCases.filter((tc) => tc.priority === 'P1');
+                if (p0Cases.length > 0) {
+                    lines.push('**P0 — Must test:**');
+                    lines.push('');
+                    for (const tc of p0Cases) {
+                        lines.push(`- [ ] **${tc.name}** (${tc.type})`);
+                        if (tc.preconditions.length > 0) {
+                            lines.push(`  - Preconditions: ${tc.preconditions.join('; ')}`);
+                        }
+                        lines.push(`  - Steps: ${tc.steps.join(' → ')}`);
+                        lines.push(`  - Expected: ${tc.expectedOutcome}`);
                     }
-                    lines.push(`  - Steps: ${tc.steps.join(' → ')}`);
-                    lines.push(`  - Expected: ${tc.expectedOutcome}`);
+                    lines.push('');
                 }
-                lines.push('');
-            }
-            // Show P1 as a collapsed checklist
-            if (p1Cases.length > 0) {
-                lines.push(`<details><summary>P1 — Should test (${p1Cases.length})</summary>`);
-                lines.push('');
-                for (const tc of p1Cases) {
-                    lines.push(`- [ ] **${tc.name}** (${tc.type}) — ${tc.expectedOutcome}`);
+                if (p1Cases.length > 0) {
+                    lines.push(`<details><summary>P1 — Should test (${p1Cases.length})</summary>`);
+                    lines.push('');
+                    for (const tc of p1Cases) {
+                        lines.push(`- [ ] **${tc.name}** (${tc.type}) — ${tc.expectedOutcome}`);
+                    }
+                    lines.push('');
+                    lines.push('</details>');
+                    lines.push('');
                 }
-                lines.push('');
-                lines.push('</details>');
-                lines.push('');
             }
         }
     }
-    // Covered flow expansion — collapsed by default
-    if (coveredDesigns.length > 0) {
-        lines.push('## Covered Flows (Regression / Expansion)');
+    // ── Covered flows ──
+    if (coveredStrategies.length > 0) {
+        lines.push('## Regression Check: Covered Flows (Already Have Tests)');
         lines.push('');
-        lines.push('These flows already have specs. The test cases below extend coverage for changes in this PR.');
+        lines.push('These flows have existing E2E specs. The existing tests should catch regressions automatically.');
+        lines.push('**No manual action required** unless CI tests fail on these flows.');
         lines.push('');
-        for (const td of coveredDesigns) {
-            const strategy = crew.strategyEntries.find((s) => s.flowId === td.flowId);
-            const approach = strategy?.approach ?? 'smoke-test';
-            const p0Count = td.testCases.filter((tc) => tc.priority === 'P0').length;
-            lines.push(`<details><summary><strong>${td.flowName}</strong> — ${approach} | ${td.testCases.length} cases (${p0Count} P0)</summary>`);
+        for (const strategy of coveredStrategies) {
+            const td = crew.testDesigns.find((d) => d.flowId === strategy.flowId);
+            const caseCount = td ? td.testCases.length : 0;
+            const detail = caseCount > 0 ? ` | ${caseCount} cases` : '';
+            lines.push(`<details><summary><strong>${strategy.flowName}</strong> — ${strategy.approach}${detail} (${strategy.priority})</summary>`);
             lines.push('');
-            for (const tc of td.testCases) {
-                lines.push(`- [ ] **${tc.name}** (${tc.priority}, ${tc.type}) — ${tc.expectedOutcome}`);
+            lines.push(`Existing tests should cover this. Cross-impact risk: ${strategy.crossImpactRisk}`);
+            if (strategy.rationale && !strategy.rationale.includes('Default strategy')) {
+                lines.push(`> ${strategy.rationale}`);
+            }
+            if (strategy.testCategories.length > 0) {
+                lines.push(`Test categories: ${strategy.testCategories.join(', ')}`);
+            }
+            if (td && td.testCases.length > 0) {
+                lines.push('');
+                for (const tc of td.testCases) {
+                    lines.push(`- [ ] **${tc.name}** (${tc.priority}, ${tc.type}) — ${tc.expectedOutcome}`);
+                }
             }
             lines.push('');
             lines.push('</details>');
             lines.push('');
         }
     }
-    // Cross-impacts section
+    // ── Cross-impacts ──
     const highRisk = crew.crossImpacts.filter((ci) => ci.riskLevel === 'high');
     if (highRisk.length > 0) {
-        lines.push('## High-Risk Cross-Impacts');
+        lines.push('## High-Risk Cross-Impacts — Verify Before Release');
         lines.push('');
-        lines.push('These cross-family dependencies should be verified during release testing:');
+        lines.push('Changes in one area may break these related areas. Manually verify or ensure E2E tests cover both sides:');
         lines.push('');
         for (const ci of highRisk) {
             lines.push(`- **${ci.sourceFamily}** → **${ci.affectedFamily}**: ${ci.sharedDependency}`);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@yasserkhanorg/e2e-agents",
-  "version": "1.8.3",
+  "version": "1.8.5",
   "description": "AI-powered E2E test impact analysis, generation, and healing. Analyzes code changes to identify affected Playwright tests, detects coverage gaps, and generates or repairs specs using pluggable LLM providers (Claude, OpenAI, Ollama). Includes MCP server, traceability, and CI/CD integration.",
   "main": "dist/index.js",
   "module": "dist/esm/index.js",