npm - explorbot - Versions diffs - 0.1.10 → 0.1.11 - Mend

explorbot 0.1.10 → 0.1.11

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (84)

package/README.md +27 -1
package/bin/explorbot-cli.ts +27 -18
package/dist/bin/explorbot-cli.js +26 -18
package/dist/package.json +2 -2
package/dist/rules/navigator/output.md +9 -0
package/dist/rules/navigator/verification-actions.md +2 -0
package/dist/src/action-result.js +23 -1
package/dist/src/action.js +46 -38
package/dist/src/ai/bosun.js +11 -1
package/dist/src/ai/conversation.js +39 -0
package/dist/src/ai/historian/codeceptjs.js +109 -0
package/dist/src/ai/historian/experience.js +320 -0
package/dist/src/ai/historian/mixin.js +2 -0
package/dist/src/ai/historian/playwright.js +145 -0
package/dist/src/ai/historian/utils.js +18 -0
package/dist/src/ai/historian.js +19 -405
package/dist/src/ai/navigator.js +82 -29
package/dist/src/ai/pilot.js +232 -13
package/dist/src/ai/planner.js +29 -9
package/dist/src/ai/provider.js +54 -17
package/dist/src/ai/researcher.js +41 -32
package/dist/src/ai/rules.js +26 -14
package/dist/src/ai/tester.js +90 -26
package/dist/src/ai/tools.js +13 -7
package/dist/src/browser-server.js +16 -3
package/dist/src/commands/add-rule-command.js +11 -8
package/dist/src/commands/clean-command.js +2 -1
package/dist/src/commands/explore-command.js +27 -15
package/dist/src/commands/init-command.js +9 -8
package/dist/src/commands/plan-command.js +32 -0
package/dist/src/commands/plan-save-command.js +19 -7
package/dist/src/commands/rerun-command.js +4 -0
package/dist/src/components/App.js +15 -5
package/dist/src/execution-controller.js +13 -2
package/dist/src/experience-tracker.js +20 -64
package/dist/src/explorbot.js +5 -8
package/dist/src/explorer.js +9 -2
package/dist/src/observability.js +50 -99
package/dist/src/playwright-recorder.js +309 -0
package/dist/src/test-plan.js +12 -0
package/dist/src/utils/aria.js +37 -1
package/dist/src/utils/error-page.js +20 -7
package/dist/src/utils/next-steps.js +37 -0
package/package.json +2 -2
package/rules/navigator/output.md +9 -0
package/rules/navigator/verification-actions.md +2 -0
package/src/action-result.ts +26 -1
package/src/action.ts +44 -37
package/src/ai/bosun.ts +11 -1
package/src/ai/conversation.ts +37 -0
package/src/ai/historian/codeceptjs.ts +130 -0
package/src/ai/historian/experience.ts +383 -0
package/src/ai/historian/mixin.ts +4 -0
package/src/ai/historian/playwright.ts +169 -0
package/src/ai/historian/utils.ts +23 -0
package/src/ai/historian.ts +35 -473
package/src/ai/navigator.ts +82 -29
package/src/ai/pilot.ts +237 -14
package/src/ai/planner.ts +29 -9
package/src/ai/provider.ts +51 -17
package/src/ai/researcher.ts +45 -33
package/src/ai/rules.ts +27 -14
package/src/ai/tester.ts +94 -26
package/src/ai/tools.ts +47 -25
package/src/browser-server.ts +17 -3
package/src/commands/add-rule-command.ts +11 -7
package/src/commands/clean-command.ts +2 -1
package/src/commands/explore-command.ts +29 -15
package/src/commands/init-command.ts +9 -8
package/src/commands/plan-command.ts +35 -0
package/src/commands/plan-save-command.ts +18 -7
package/src/commands/rerun-command.ts +5 -0
package/src/components/App.tsx +16 -5
package/src/config.ts +6 -1
package/src/execution-controller.ts +14 -3
package/src/experience-tracker.ts +21 -72
package/src/explorbot.ts +5 -8
package/src/explorer.ts +11 -2
package/src/observability.ts +50 -109
package/src/playwright-recorder.ts +305 -0
package/src/test-plan.ts +12 -0
package/src/utils/aria.ts +38 -1
package/src/utils/error-page.ts +22 -7
package/src/utils/next-steps.ts +51 -0

package/dist/src/ai/historian.js CHANGED Viewed

@@ -1,379 +1,31 @@
-import { mkdirSync, readFileSync, writeFileSync } from 'node:fs';
-import { join } from 'node:path';
-import dedent from 'dedent';
-import { z } from 'zod';
-import { ActionResult } from "../action-result.js";
-import { ConfigParser } from "../config.js";
+import { readFileSync, writeFileSync } from 'node:fs';
 import { ExperienceTracker } from "../experience-tracker.js";
-import { KnowledgeTracker } from "../knowledge-tracker.js";
-import { Test } from "../test-plan.js";
-import { createDebug, tag } from "../utils/logger.js";
-import { extractStatePath } from "../utils/url-matcher.js";
-import { ASSERTION_TOOLS, CODECEPT_TOOLS } from "./tools.js";
-const debugLog = createDebug('explorbot:historian');
-export class Historian {
-    provider;
-    experienceTracker;
-    reporter;
-    stateManager;
-    savedFiles = new Set();
-    constructor(provider, experienceTracker, reporter, stateManager) {
+import { tag } from "../utils/logger.js";
+import { relativeToCwd } from "../utils/next-steps.js";
+import { WithCodeceptJS } from "./historian/codeceptjs.js";
+import { WithExperience } from "./historian/experience.js";
+import { WithPlaywright } from "./historian/playwright.js";
+export { isNonReusableCode } from "./historian/utils.js";
+const HistorianBase = WithPlaywright(WithCodeceptJS(WithExperience(Object)));
+export class Historian extends HistorianBase {
+    constructor(provider, experienceTracker, reporter, stateManager, config, recorder) {
+        super();
         this.provider = provider;
         this.experienceTracker = experienceTracker || new ExperienceTracker();
         this.reporter = reporter;
         this.stateManager = stateManager;
+        this.config = config;
+        this.recorder = recorder;
+        this.savedFiles = new Set();
+    }
+    isPlaywrightFramework() {
+        return this.config?.ai?.agents?.historian?.framework === 'playwright';
     }
     getSavedFiles() {
         return [...this.savedFiles];
     }
-    async saveSession(task, initialState, conversation) {
-        debugLog('Saving session experience');
-        const result = this.determineResult(task);
-        const toolExecutions = conversation.getToolExecutions();
-        if (task instanceof Test) {
-            task.generatedCode = this.toCode(conversation, task.description);
-        }
-        const steps = await this.extractSteps(toolExecutions);
-        await this.detectRetryPatterns(toolExecutions, initialState);
-        const verifiedSteps = await this.verifySteps(steps, initialState);
-        if (verifiedSteps.length > 0) {
-            const relatedUrls = this.extractVisitedUrls(toolExecutions, initialState.url || '');
-            this.experienceTracker.writeFlow(initialState, {
-                scenario: task.description,
-                steps: verifiedSteps,
-                relatedUrls,
-            });
-        }
-        if (task instanceof Test && result !== 'failed') {
-            await this.reportSession(task, steps);
-        }
-        tag('substep').log(`Historian saved session for: ${task.description}`);
-    }
-    async reportSession(test, steps) {
-        if (!this.reporter)
-            return;
-        const reporterSteps = steps.map((step) => ({
-            title: step.message,
-            status: step.status === 'passed' ? 'passed' : 'failed',
-            code: step.code ? step.code.split('\n').filter((l) => l.trim()) : [],
-            discovery: step.discovery,
-        }));
-        await this.reporter.reportSteps(test, reporterSteps);
-    }
-    async extractSteps(toolExecutions) {
-        const stepsWithDiffs = [];
-        for (const exec of toolExecutions) {
-            if (!CODECEPT_TOOLS.includes(exec.toolName))
-                continue;
-            if (!exec.output?.code)
-                continue;
-            if (!exec.wasSuccessful)
-                continue;
-            if (isNonReusableCode(exec.output.code))
-                continue;
-            const message = this.getExecutionLabel(exec, `Executed ${exec.toolName}`);
-            const ariaDiff = exec.output?.pageDiff?.ariaChanges || null;
-            const urlChanged = exec.output?.pageDiff?.urlChanged || false;
-            const step = {
-                message,
-                status: 'passed',
-                tool: exec.toolName,
-                code: this.stripComments(exec.output.code),
-            };
-            stepsWithDiffs.push({ step, ariaDiff, urlChanged });
-        }
-        await this.analyzeDiscoveries(stepsWithDiffs);
-        return stepsWithDiffs.map((s) => s.step);
-    }
-    async verifySteps(steps, initialState) {
-        if (steps.length === 0)
-            return [];
-        const existingExperience = this.experienceTracker
-            .getRelevantExperience(initialState)
-            .map((e) => e.content)
-            .filter(Boolean)
-            .join('\n');
-        const existingSummary = existingExperience.length > 2000 ? existingExperience.substring(0, 2000) : existingExperience;
-        const stepsList = steps.map((s, i) => `${i}. ${s.message}\n   Code: ${s.code || 'none'}`).join('\n');
-        const prompt = dedent `
-      Review these test steps and determine which are valuable to save as experience
-      for future test executions on this page.
-      <steps>
-      ${stepsList}
-      </steps>
-      ${existingSummary ? `<existing_experience>\n${existingSummary}\n</existing_experience>` : ''}
-      For each step, determine if it is useful:
-      - NOT useful if it uses auto-generated or unstable locators (ember IDs, numeric data-testid, random IDs)
-      - NOT useful if it is already documented in existing experience
-      - NOT useful if it requires an unclear precondition that would not be reproducible
-      - NOT useful if it is trivial navigation (I.amOnPage) without meaningful context
-      - USEFUL if it demonstrates how to interact with a specific UI component (expand dropdown, fill form, etc)
-      - USEFUL if it shows a working approach for a common task on this page
-    `;
-        const schema = z.object({
-            steps: z.array(z.object({
-                stepIndex: z.number(),
-                useful: z.boolean(),
-            })),
-        });
-        try {
-            const response = await this.provider.generateObject([
-                { role: 'system', content: 'Evaluate test steps for experience value. Be selective — only keep steps that teach something reusable.' },
-                { role: 'user', content: prompt },
-            ], schema, undefined, { telemetryFunctionId: 'historian.verifySteps' });
-            const usefulIndices = new Set((response?.object?.steps || []).filter((s) => s.useful).map((s) => s.stepIndex));
-            const verified = steps.filter((_, i) => usefulIndices.has(i));
-            debugLog('Verified %d/%d steps as useful', verified.length, steps.length);
-            return verified;
-        }
-        catch (error) {
-            debugLog('Step verification failed, keeping all steps: %s', error.message);
-            return steps;
-        }
-    }
-    async detectRetryPatterns(toolExecutions, initialState) {
-        if (!this.experienceTracker || !this.stateManager)
-            return;
-        const failedByTool = new Map();
-        const candidates = [];
-        for (const exec of toolExecutions) {
-            if (!CODECEPT_TOOLS.includes(exec.toolName))
-                continue;
-            if (!exec.output?.code)
-                continue;
-            if (!exec.wasSuccessful) {
-                const bucket = failedByTool.get(exec.toolName) || [];
-                bucket.push(exec);
-                failedByTool.set(exec.toolName, bucket);
-                continue;
-            }
-            const failed = failedByTool.get(exec.toolName);
-            if (failed?.length) {
-                candidates.push({ failed: [...failed], success: exec });
-                failedByTool.set(exec.toolName, []);
-            }
-        }
-        if (candidates.length === 0)
-            return;
-        const prompt = dedent `
-      Analyze these retry patterns where a tool failed multiple times before succeeding.
-      For each candidate, determine which failed attempts were trying to do the same thing as the success.
-      ${candidates
-            .map((c, i) => dedent `
-        Candidate ${i}:
-        Failed attempts:
-        ${c.failed.map((f, j) => `  ${j}: ${this.getExecutionLabel(f, f.toolName)} → code: ${f.output?.code}`).join('\n')}
-        Succeeded:
-          ${this.getExecutionLabel(c.success, c.success.toolName)} → code: ${c.success.output.code}
-      `)
-            .join('\n\n')}
-      For each candidate where failures share the same intent as the success:
-      - candidateIndex: index of the candidate
-      - failedIndices: which failed attempts share the same intent
-      - intent: business-focused description of what was being done
-      - explanation: actionable tip explaining which element works and what to avoid
-    `;
-        const schema = z.object({
-            retryPatterns: z.array(z.object({
-                candidateIndex: z.number(),
-                failedIndices: z.array(z.number()),
-                intent: z.string(),
-                explanation: z.string(),
-            })),
-        });
-        try {
-            const response = await this.provider.generateObject([
-                { role: 'system', content: 'Analyze retry patterns in web testing tool executions. Identify when failed attempts share the same intent as a successful one.' },
-                { role: 'user', content: prompt },
-            ], schema);
-            for (const pattern of response?.object?.retryPatterns || []) {
-                const candidate = candidates[pattern.candidateIndex];
-                if (!candidate)
-                    continue;
-                const url = candidate.success.output?.pageDiff?.currentUrl;
-                let state = initialState;
-                if (url && url !== initialState.url) {
-                    const transition = this.stateManager.getLastVisitToPath(url);
-                    if (transition) {
-                        state = ActionResult.fromState(transition.toState);
-                    }
-                }
-                if (isNonReusableCode(candidate.success.output.code))
-                    continue;
-                this.experienceTracker.writeAction(state, { title: pattern.intent, code: candidate.success.output.code, explanation: pattern.explanation });
-            }
-            debugLog('Detected %d retry patterns', response?.object?.retryPatterns?.length || 0);
-        }
-        catch (error) {
-            debugLog('Failed to detect retry patterns: %s', error.message);
-        }
-    }
-    async analyzeDiscoveries(stepsWithDiffs) {
-        if (!stepsWithDiffs.some((s) => s.ariaDiff))
-            return;
-        const prompt = this.buildDiscoveryPrompt(stepsWithDiffs);
-        const schema = z.object({
-            discoveries: z.array(z.object({
-                stepNumber: z.number(),
-                discoveries: z.array(z.string()),
-            })),
-        });
-        try {
-            const response = await this.provider.generateObject([
-                { role: 'system', content: 'Analyze test execution steps and identify valuable UI discoveries. Return multiple discoveries per step when multiple new elements appear. Return no discoveries for steps with no meaningful changes.' },
-                { role: 'user', content: prompt },
-            ], schema);
-            for (const { stepNumber, discoveries } of response?.object?.discoveries || []) {
-                const stepIndex = stepNumber - 1;
-                if (!stepsWithDiffs[stepIndex])
-                    continue;
-                if (discoveries.length === 0)
-                    continue;
-                stepsWithDiffs[stepIndex].step.discovery = discoveries.join('\n');
-            }
-        }
-        catch (error) {
-            debugLog('Failed to analyze discoveries: %s', error.message);
-        }
-    }
-    buildDiscoveryPrompt(stepsWithDiffs) {
-        let prompt = dedent `
-      Review these test steps and their ARIA diffs. Identify new UI elements that appeared
-      which could be valuable for:
-      - Deeper testing of this feature
-      - Related features that can be triggered from this flow
-      IMPORTANT:
-      - Return MULTIPLE discoveries per step when multiple new elements appear (e.g., if 3 buttons appeared, return an array with 3 discoveries for that step)
-      - Return NO discoveries (empty array) for a step if nothing new appeared or if elements were already discovered in previous steps
-      - Only include steps that have discoveries
-      Steps:
-    `;
-        for (let i = 0; i < stepsWithDiffs.length; i++) {
-            const { step, ariaDiff, urlChanged } = stepsWithDiffs[i];
-            prompt += `\n\nStep ${i + 1}: ${step.message}`;
-            if (ariaDiff) {
-                prompt += `\n${ariaDiff}`;
-            }
-        }
-        prompt += dedent `
-      Return discoveries in format:
-      - stepNumber: which step revealed these elements
-      - discoveries: array of brief descriptions like ["A new button appeared: Publish To Twitter", "A new input field appeared: Description"]
-      Only return elements that are actionable and could lead to new test scenarios.
-      Ignore generic UI changes (loading spinners, timestamps, etc).
-      If errors or warnings appeared in the step, include them in the discoveries array.
-      If multiple buttons, inputs, links, or other actionable elements appeared in the same step, include all of them in the discoveries array.
-    `;
-        return prompt;
-    }
-    determineResult(task) {
-        if ('isSuccessful' in task && task.isSuccessful)
-            return 'success';
-        if ('hasAchievedAny' in task && task.hasAchievedAny())
-            return 'partial';
-        const hasPassedNotes = Object.values(task.notes).some((n) => n.status === 'passed');
-        if (hasPassedNotes)
-            return 'partial';
-        return 'failed';
-    }
-    extractVisitedUrls(toolExecutions, initialUrl) {
-        const urls = new Set();
-        const initialPath = extractStatePath(initialUrl);
-        for (const exec of toolExecutions) {
-            const currentUrl = exec.output?.pageDiff?.currentUrl;
-            if (!currentUrl)
-                continue;
-            const relativePath = extractStatePath(currentUrl);
-            if (relativePath && relativePath !== initialPath) {
-                urls.add(relativePath);
-            }
-        }
-        return [...urls];
-    }
-    toCode(conversation, scenario) {
-        const toolExecutions = conversation.getToolExecutions();
-        const TRACKABLE_TOOLS = [...CODECEPT_TOOLS, ...ASSERTION_TOOLS];
-        const successfulSteps = toolExecutions.filter((exec) => exec.wasSuccessful && TRACKABLE_TOOLS.includes(exec.toolName) && exec.output?.code);
-        if (successfulSteps.length === 0) {
-            return '';
-        }
-        const lines = [];
-        lines.push(`Scenario('${this.escapeString(scenario)}', ({ I }) => {`);
-        for (const exec of successfulSteps) {
-            if (isNonReusableCode(exec.output.code))
-                continue;
-            const explanation = this.getExecutionLabel(exec);
-            if (explanation) {
-                lines.push('');
-                lines.push(`  Section('${this.escapeString(explanation)}');`);
-            }
-            const code = this.stripComments(exec.output.code);
-            const codeLines = code.includes('\n') ? code.split('\n') : code.split('; ');
-            for (const codeLine of codeLines) {
-                const trimmed = codeLine.trim();
-                if (trimmed) {
-                    lines.push(`  ${trimmed}`);
-                }
-            }
-        }
-        lines.push('});');
-        return lines.join('\n');
-    }
     savePlanToFile(plan) {
-        const lines = [];
-        lines.push(`import step, { Section } from 'codeceptjs/steps';`);
-        lines.push('');
-        lines.push(`Feature('${this.escapeString(plan.title)}')`);
-        lines.push('');
-        const startUrl = plan.url || plan.tests[0]?.startUrl;
-        if (startUrl) {
-            lines.push('Before(({ I }) => {');
-            lines.push(`  I.amOnPage('${this.escapeString(startUrl)}');`);
-            lines.push(...this.getKnowledgeLines(startUrl));
-            lines.push('});');
-            lines.push('');
-        }
-        for (const test of plan.tests) {
-            if (test.generatedCode) {
-                if (test.isSuccessful) {
-                    lines.push(test.generatedCode);
-                }
-                else {
-                    lines.push(`// FAILED: ${test.scenario}`);
-                    lines.push(test.generatedCode.replace(/Scenario\(/, 'Scenario.skip('));
-                }
-                lines.push('');
-                continue;
-            }
-            lines.push(`Scenario.todo('${this.escapeString(test.scenario)}', ({ I }) => {`);
-            if (test.plannedSteps.length > 0) {
-                for (const step of test.plannedSteps) {
-                    lines.push(`  // ${step}`);
-                }
-            }
-            else {
-                lines.push(`  // ${test.scenario}`);
-            }
-            lines.push('});');
-            lines.push('');
-        }
-        const testsDir = ConfigParser.getInstance().getTestsDir();
-        mkdirSync(testsDir, { recursive: true });
-        const filename = plan.title.replace(/[^a-zA-Z0-9]/g, '_').toLowerCase();
-        const filePath = join(testsDir, `${filename}.js`);
-        writeFileSync(filePath, lines.join('\n'));
-        this.savedFiles.add(filePath);
-        tag('substep').log(`Saved plan tests to: ${filePath}`);
-        return filePath;
+        return this.isPlaywrightFramework() ? this.savePlaywrightPlanToFile(plan) : this.saveCodeceptPlanToFile(plan);
     }
     rewriteScenarioInFile(filePath, healedSteps) {
         let content = readFileSync(filePath, 'utf-8');
@@ -384,44 +36,6 @@ export class Historian {
         }
         writeFileSync(filePath, content);
         this.savedFiles.add(filePath);
-        tag('substep').log(`Updated test file with healed steps: ${filePath}`);
+        tag('substep').log(`Updated test file with healed steps: ${relativeToCwd(filePath)}`);
     }
-    getExecutionLabel(exec, fallback) {
-        return exec.input?.explanation || exec.input?.assertion || exec.input?.note || fallback || '';
-    }
-    escapeString(str) {
-        return str.replace(/'/g, "\\'").replace(/\n/g, ' ');
-    }
-    getKnowledgeLines(url, indent = '  ') {
-        const knowledgeTracker = new KnowledgeTracker();
-        const state = new ActionResult({ url });
-        const { wait, waitForElement, code } = knowledgeTracker.getStateParameters(state, ['wait', 'waitForElement', 'code']);
-        const lines = [];
-        if (wait !== undefined) {
-            lines.push(`${indent}I.wait(${wait});`);
-        }
-        if (waitForElement) {
-            lines.push(`${indent}I.waitForElement(${JSON.stringify(waitForElement)});`);
-        }
-        if (code) {
-            for (const codeLine of code.split('\n')) {
-                const trimmed = codeLine.trim();
-                if (trimmed)
-                    lines.push(`${indent}${trimmed}`);
-            }
-        }
-        return lines;
-    }
-    stripComments(code) {
-        return code
-            .split('\n')
-            .filter((line) => {
-            const trimmed = line.trim();
-            return trimmed && !trimmed.startsWith('//') && !trimmed.startsWith('/*') && !trimmed.startsWith('*');
-        })
-            .join('\n');
-    }
-}
-export function isNonReusableCode(code) {
-    return /\bI\.clickXY\s*\(/.test(code);
 }

package/dist/src/ai/navigator.js CHANGED Viewed

@@ -8,8 +8,9 @@ import { HooksRunner } from "../utils/hooks-runner.js";
 import { createDebug, pluralize, tag } from '../utils/logger.js';
 import { loop, pause } from '../utils/loop.js';
 import { RulesLoader } from "../utils/rules-loader.js";
+import { extractStatePath } from '../utils/url-matcher.js';
 import { Researcher } from "./researcher.js";
-import { actionRule, locatorRule } from './rules.js';
+import { actionRule, locatorRule, unexpectedPopupRule } from './rules.js';
 import { isInteractive } from './task-agent.js';
 import { createAgentTools } from "./tools.js";
 const debugLog = createDebug('explorbot:navigator');
@@ -131,11 +132,10 @@ class Navigator {
       </hint>`;
         }
         if (!actionResult.isInsideIframe) {
-            const toc = this.experienceTracker.getExperienceTableOfContents(actionResult);
-            if (toc.length > 0) {
-                const totalSections = toc.reduce((sum, entry) => sum + entry.sections.length, 0);
-                tag('substep').log(`Found ${toc.length} experience ${pluralize(toc.length, 'file')} (${totalSections} sections) for: ${actionResult.url}`);
-                experience = renderExperienceToc(toc);
+            const successful = this.experienceTracker.getSuccessfulExperience(actionResult);
+            if (successful.length > 0) {
+                tag('substep').log(`Found ${successful.length} experience ${pluralize(successful.length, 'file')} for: ${actionResult.url}`);
+                experience = `<experience>\nPast successful recipes recorded from prior runs for this page. Prefer these solutions first if they match the goal.\n\n${successful.join('\n\n')}\n</experience>`;
             }
         }
         const prompt = dedent `
@@ -163,6 +163,8 @@ class Navigator {
       ${actionRule}
+      ${unexpectedPopupRule}
       ${RulesLoader.loadRules('navigator', ['multiple-locator', 'output'], actionResult.url || '').replace('{{maxAttempts}}', String(this.MAX_ATTEMPTS))}
       ${experience}
@@ -171,11 +173,13 @@ class Navigator {
     `;
         const conversation = this.provider.startConversation(this.systemPrompt, 'navigator');
         conversation.addUserText(prompt);
-        const tools = this.buildExperienceTools();
+        const tools = undefined;
         let codeBlocks = [];
         let htmlContextAdded = false;
         let codeBlockIndex = 0;
         let totalAttempts = 0;
+        const progressBlocks = [];
+        const batchFailures = [];
         let resolved = false;
         await loop(async ({ stop }) => {
             if (codeBlocks.length === 0) {
@@ -194,43 +198,90 @@ class Navigator {
             }
             const codeBlock = codeBlocks[codeBlockIndex];
             if (!codeBlock) {
+                if (batchFailures.length === 0 && htmlContextAdded) {
+                    stop();
+                    return;
+                }
+                tag('substep').log('Feeding failures back to AI for a new batch...');
+                let contextMsg = 'Previous solutions did not work. Analyze the failures and try DIFFERENT strategies (not syntactic variants of the same locator).\n\n';
+                if (batchFailures.length > 0) {
+                    const lines = batchFailures.map((f) => `- \`${f.code.split('\n')[0]}\` → ${f.error}`).join('\n');
+                    contextMsg += `<previous_failures>\n${lines}\n</previous_failures>\n\n`;
+                }
                 if (!htmlContextAdded) {
                     htmlContextAdded = true;
-                    tag('substep').log('Adding HTML context for better resolution...');
-                    conversation.addUserText(dedent `
-              Previous solutions did not work. Here is the full HTML context:
-              <page_html>
-              ${await actionResult.combinedHtml()}
-              </page_html>
-              Please suggest new solutions based on this additional context.
-            `);
-                    codeBlocks = [];
-                    return;
+                    contextMsg += `Full HTML context:\n\n<page_html>\n${await actionResult.combinedHtml()}\n</page_html>\n\n`;
                 }
-                stop();
+                contextMsg += 'Propose new solutions. If errors mention "intercepts pointer events" or timeouts on visible elements, an overlay is blocking — dismiss it first (Escape, click outside, Close button) before retrying the original action.';
+                conversation.addUserText(contextMsg);
+                codeBlocks = [];
+                batchFailures.length = 0;
                 return;
             }
             codeBlockIndex++;
             totalAttempts++;
             await this.explorer.switchToMainFrame();
+            const prevHash = action.actionResult?.getStateHash() ?? actionResult.getStateHash();
             debugLog(`Attempting resolution: ${codeBlock}`);
-            resolved = await action.attempt(codeBlock, message);
+            const attemptOk = await action.attempt(codeBlock, message);
+            const page = action.playwrightHelper?.page;
+            if (page) {
+                try {
+                    await page.waitForLoadState('load', { timeout: 5000 });
+                }
+                catch {
+                    // Navigation did not reach 'load' state within timeout; continue and verify URL
+                }
+            }
+            if (!attemptOk) {
+                const raw = action.lastError?.message || 'attempt failed';
+                const firstMeaningful = raw.split('\n').find((l) => l.trim() && !l.trim().startsWith('at ')) || raw;
+                const shortErr = firstMeaningful.replace(/\s+/g, ' ').trim().slice(0, 220);
+                batchFailures.push({ code: codeBlock, error: shortErr });
+            }
             if (expectedUrl) {
-                await action.getActor().wait(2);
-                const freshState = await action.capturePageState();
-                if (normalizeUrl(freshState.url || '') === normalizeUrl(expectedUrl)) {
-                    resolved = true;
+                if (page) {
+                    try {
+                        await page.waitForURL((url) => normalizeUrl(url.pathname) === normalizeUrl(expectedUrl), { timeout: 5000 });
+                    }
+                    catch {
+                        // URL did not transition to expectedUrl within timeout
+                    }
                 }
-                else if (resolved) {
+                const freshState = await action.capturePageState();
+                const urlMatches = normalizeUrl(freshState.url || '') === normalizeUrl(expectedUrl);
+                const stateChanged = freshState.getStateHash() !== actionResult.getStateHash();
+                resolved = urlMatches && stateChanged;
+                if (!resolved && attemptOk) {
                     tag('warning').log(`URL verification failed: expected ${expectedUrl}, got ${freshState.url}`);
-                    resolved = false;
+                }
+                if (freshState.getStateHash() !== prevHash && (attemptOk || urlMatches)) {
+                    progressBlocks.push(codeBlock);
                 }
             }
+            else {
+                resolved = attemptOk;
+                if (attemptOk)
+                    progressBlocks.push(codeBlock);
+            }
             if (resolved) {
                 tag('success').log('Navigation resolved successfully');
-                this.experienceTracker.writeAction(actionResult, { title: message, code: codeBlock });
+                let scenario = message.split('\n')[0];
+                if (expectedUrl) {
+                    const fromPath = extractStatePath(actionResult.url || '');
+                    const toPath = extractStatePath(expectedUrl);
+                    scenario = `reach ${toPath} from ${fromPath}`;
+                }
+                const recipe = progressBlocks
+                    .join('\n')
+                    .split('\n')
+                    .filter((line) => !/^\s*I\.amOnPage\s*\(/.test(line))
+                    .join('\n')
+                    .trim();
+                if (recipe) {
+                    const body = `## FLOW: ${scenario}\n\n* ${scenario}\n\n\`\`\`js\n${recipe}\n\`\`\`\n\n---\n`;
+                    this.experienceTracker.writeFlow(actionResult, body);
+                }
                 stop();
                 return;
             }
@@ -455,6 +506,7 @@ class Navigator {
         const tools = this.buildExperienceTools();
         let codeBlocks = [];
         const successfulCodes = [];
+        const assertionSteps = [];
         const action = this.explorer.createAction();
         await loop(async ({ stop, iteration }) => {
             if (codeBlocks.length === 0) {
@@ -479,6 +531,7 @@ class Navigator {
             if (verified) {
                 tag('success').log('Verification passed');
                 successfulCodes.push(codeBlock);
+                assertionSteps.push(...action.assertionSteps);
             }
         }, {
             maxAttempts: this.MAX_ATTEMPTS,
@@ -493,7 +546,7 @@ class Navigator {
         const verified = totalAttempted <= 1 ? successfulCodes.length > 0 : successfulCodes.length > totalAttempted / 2;
         actionResult.addVerification(message, verified);
         this.explorer.getStateManager().updateState(actionResult);
-        return { verified, successfulCodes, totalAttempted };
+        return { verified, successfulCodes, assertionSteps, totalAttempted };
     }
 }
 export { Navigator };