npm - explorbot - Versions diffs - 0.1.18 → 0.1.20 - Mend

explorbot 0.1.18 → 0.1.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30)

package/bin/explorbot-cli.ts +19 -1
package/dist/bin/explorbot-cli.js +16 -1
package/dist/package.json +1 -1
package/dist/src/action.js +8 -3
package/dist/src/ai/driller.js +1 -1
package/dist/src/ai/navigator.js +43 -2
package/dist/src/ai/pilot.js +5 -0
package/dist/src/ai/planner.js +21 -5
package/dist/src/ai/rerunner.js +1 -1
package/dist/src/ai/researcher/deep-analysis.js +22 -7
package/dist/src/ai/researcher.js +10 -5
package/dist/src/ai/session-analyst.js +24 -0
package/dist/src/ai/tester.js +3 -3
package/dist/src/ai/tools.js +3 -2
package/dist/src/commands/explore-command.js +5 -1
package/dist/src/components/LogPane.js +34 -4
package/package.json +1 -1
package/src/action.ts +8 -3
package/src/ai/driller.ts +1 -1
package/src/ai/navigator.ts +43 -2
package/src/ai/pilot.ts +5 -0
package/src/ai/planner.ts +22 -5
package/src/ai/rerunner.ts +1 -1
package/src/ai/researcher/deep-analysis.ts +20 -7
package/src/ai/researcher.ts +9 -5
package/src/ai/session-analyst.ts +24 -0
package/src/ai/tester.ts +3 -3
package/src/ai/tools.ts +3 -2
package/src/commands/explore-command.ts +6 -1
package/src/components/LogPane.tsx +42 -9

package/bin/explorbot-cli.ts CHANGED Viewed

@@ -43,6 +43,8 @@ interface CLIOptions {
 }
 function buildExplorBotOptions(from: string | undefined, options: CLIOptions): ExplorBotOptions {
+  const sessionFile = options.session === true ? path.join(path.resolve(options.path || process.cwd()), 'output', 'session.json') : options.session;
   return {
     from,
     verbose: options.verbose || options.debug,
@@ -51,7 +53,7 @@ function buildExplorBotOptions(from: string | undefined, options: CLIOptions): E
     show: options.show,
     headless: options.headless,
     incognito: options.incognito,
-    session: options.session === true ? 'output/session.json' : options.session,
+    session: sessionFile,
   } as ExplorBotOptions;
 }
@@ -597,6 +599,22 @@ addCommonOptions(program.command('research <url>').description('Research a page
   }
 );
+addCommonOptions(program.command('navigate <url>').description('Navigate to a URL using the AI Navigator. Exits 0 if reachable, 1 otherwise.')).action(async (url, options) => {
+  try {
+    const explorBot = new ExplorBot(buildExplorBotOptions(url, options));
+    await explorBot.start();
+    const { NavigateCommand } = await import('../src/commands/navigate-command.js');
+    await new NavigateCommand(explorBot).execute(url);
+    await explorBot.stop();
+    await showStatsAndExit(0);
+  } catch (error) {
+    console.error('Failed:', error instanceof Error ? error.message : 'Unknown error');
+    await showStatsAndExit(1);
+  }
+});
 addCommonOptions(
   program.command('drill <url>').alias('driller').description('Drill all components on a page to learn interactions').option('--knowledge <path>', 'Save learned interactions to knowledge file at this URL path').option('--max-components <count>', 'Maximum number of components to drill')
 ).action(async (url, options) => {

package/dist/bin/explorbot-cli.js CHANGED Viewed

@@ -27,6 +27,7 @@ if (!process.env.EXPLORBOT_NO_BANNER) {
     console.log(`⛵ ${chalk.yellow.bold(`Explorbot v${pkgVersion}`)} ${chalk.dim('Autonomous Testing Agent')}`);
 }
 function buildExplorBotOptions(from, options) {
+    const sessionFile = options.session === true ? path.join(path.resolve(options.path || process.cwd()), 'output', 'session.json') : options.session;
     return {
         from,
         verbose: options.verbose || options.debug,
@@ -35,7 +36,7 @@ function buildExplorBotOptions(from, options) {
         show: options.show,
         headless: options.headless,
         incognito: options.incognito,
-        session: options.session === true ? 'output/session.json' : options.session,
+        session: sessionFile,
     };
 }
 function addCommonOptions(cmd) {
@@ -543,6 +544,20 @@ addCommonOptions(program.command('research <url>').description('Research a page
         await showStatsAndExit(1);
     }
 });
+addCommonOptions(program.command('navigate <url>').description('Navigate to a URL using the AI Navigator. Exits 0 if reachable, 1 otherwise.')).action(async (url, options) => {
+    try {
+        const explorBot = new ExplorBot(buildExplorBotOptions(url, options));
+        await explorBot.start();
+        const { NavigateCommand } = await import('../src/commands/navigate-command.js');
+        await new NavigateCommand(explorBot).execute(url);
+        await explorBot.stop();
+        await showStatsAndExit(0);
+    }
+    catch (error) {
+        console.error('Failed:', error instanceof Error ? error.message : 'Unknown error');
+        await showStatsAndExit(1);
+    }
+});
 addCommonOptions(program.command('drill <url>').alias('driller').description('Drill all components on a page to learn interactions').option('--knowledge <path>', 'Save learned interactions to knowledge file at this URL path').option('--max-components <count>', 'Maximum number of components to drill')).action(async (url, options) => {
     try {
         const explorBot = new ExplorBot(buildExplorBotOptions(url, options));

package/dist/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "explorbot",
-  "version": "0.1.18",
+  "version": "0.1.20",
   "description": "CLI app built with React Ink, CodeceptJS, and Playwright",
   "license": "Elastic-2.0",
   "type": "module",

package/dist/src/action.js CHANGED Viewed

@@ -2,7 +2,6 @@ import fs from 'node:fs';
 import { join } from 'node:path';
 import { faker } from '@faker-js/faker';
 import { context, trace } from '@opentelemetry/api';
-import { highlight } from 'cli-highlight';
 import { container, recorder } from 'codeceptjs';
 import * as codeceptjs from 'codeceptjs';
 import { hopeThat, retryTo, tryTo, within } from 'codeceptjs/lib/effects';
@@ -12,7 +11,7 @@ import { clearActivity, setActivity } from "./activity.js";
 import { ConfigParser, outputPath } from './config.js';
 import { Observability } from "./observability.js";
 import { htmlCombinedSnapshot, minifyHtml } from './utils/html.js';
-import { createDebug, log, setStepSpanParent, tag } from './utils/logger.js';
+import { createDebug, setStepSpanParent, tag } from './utils/logger.js';
 import { safeFilename } from "./utils/strings.js";
 const debugLog = createDebug('explorbot:action');
 const FATAL_BROWSER_ERRORS = /Frame was detached|Target closed|Execution context was destroyed|Protocol error|Session closed/i;
@@ -257,7 +256,13 @@ class Action {
     async expect(codeOrFunction) {
         const codeString = typeof codeOrFunction === 'string' ? codeOrFunction : codeOrFunction.toString();
         this.expectation = codeString.toString();
-        log('Expecting', highlight(codeString, { language: 'javascript' }));
+        const expectationPreview = sanitizeCodeBlock(codeString)
+            .split('\n')
+            .map((line) => line.trim())
+            .filter(Boolean)
+            .slice(0, 2)
+            .join(' ');
+        tag('step').log(`Expecting: ${expectationPreview || 'assertion'}`);
         try {
             debugLog('Executing expectation:', codeString);
             let codeFunction;

package/dist/src/ai/driller.js CHANGED Viewed

@@ -96,7 +96,7 @@ export class Driller extends TaskAgent {
         const sessionName = `driller_${Date.now().toString(36)}`;
         this.allResults = [];
         return Observability.run(`driller: ${currentState.url}`, { tags: ['driller'], sessionId: sessionName }, async () => {
-            tag('info').log(`Driller starting on ${currentState.url}`);
+            tag('step').log(`Drilling page: ${currentState.url}`);
             await this.hooksRunner.runBeforeHook('driller', currentState.url);
             const originalState = await this.captureAnnotatedState();
             const components = await this.collectComponents(originalState, maxComponents);

package/dist/src/ai/navigator.js CHANGED Viewed

@@ -68,8 +68,48 @@ class Navigator {
         this.experienceTracker = experienceTracker || new ExperienceTracker();
         this.hooksRunner = new HooksRunner(explorer, explorer.getConfig());
     }
+    getBaseOrigin() {
+        const baseUrl = this.explorer.getConfig().playwright.url;
+        try {
+            return new URL(baseUrl).origin;
+        }
+        catch {
+            return null;
+        }
+    }
+    getComparableCurrentUrl(stateManager, expectedUrl) {
+        const currentState = stateManager.getCurrentState();
+        if (!currentState)
+            return '';
+        const current = /^https?:\/\//i.test(expectedUrl) ? currentState.fullUrl || currentState.url || '' : currentState.url || '';
+        return current;
+    }
+    isSameExpectedOrigin(expectedUrl, stateManager) {
+        const currentState = stateManager.getCurrentState();
+        if (!currentState)
+            return false;
+        const currentFullUrl = currentState.fullUrl || currentState.url || '';
+        if (!currentFullUrl)
+            return false;
+        try {
+            const currentOrigin = new URL(currentFullUrl).origin;
+            if (/^https?:\/\//i.test(expectedUrl)) {
+                return currentOrigin === new URL(expectedUrl).origin;
+            }
+            const baseOrigin = this.getBaseOrigin();
+            if (!baseOrigin)
+                return true;
+            return currentOrigin === baseOrigin;
+        }
+        catch {
+            return !/^https?:\/\//i.test(expectedUrl);
+        }
+    }
     isOnExpectedPage(expectedUrl, stateManager) {
-        const currentUrl = stateManager.getCurrentState()?.url || '';
+        if (!this.isSameExpectedOrigin(expectedUrl, stateManager)) {
+            return false;
+        }
+        const currentUrl = this.getComparableCurrentUrl(stateManager, expectedUrl);
         return normalizeUrl(currentUrl) === normalizeUrl(expectedUrl);
     }
     async visit(url) {
@@ -249,7 +289,8 @@ class Navigator {
                     }
                 }
                 const freshState = await action.capturePageState();
-                const urlMatches = normalizeUrl(freshState.url || '') === normalizeUrl(expectedUrl);
+                const currentUrl = /^https?:\/\//i.test(expectedUrl) ? freshState.fullUrl || freshState.url || '' : freshState.url || '';
+                const urlMatches = this.isSameExpectedOrigin(expectedUrl, action.stateManager) && normalizeUrl(currentUrl) === normalizeUrl(expectedUrl);
                 const stateChanged = freshState.getStateHash() !== actionResult.getStateHash();
                 resolved = urlMatches && stateChanged;
                 if (!resolved && attemptOk) {

package/dist/src/ai/pilot.js CHANGED Viewed

@@ -270,6 +270,9 @@ export class Pilot {
       overrides the others — weigh them together. Tester's record() notes are the LEAST reliable; always
       cross-check against actual actions and state. Visual screenshot analysis is strong for UI state
       (active tabs, visible counts, colors).
+      If the final page clearly shows an equivalent success state in a different UI form, do not fail only
+      because one narrow assertion targeted a specific badge, count, toast, or wording that the product
+      represents differently.
       SCENARIO TITLE defines what must happen. Action verbs require persisted evidence:
       - "Create X" → X must exist (visible, redirected to its page, or success message). Opening a form is NOT enough.
@@ -311,6 +314,8 @@ export class Pilot {
       GUIDANCE (required for "continue"): a specific next action on the current page — which tool, what
       to verify, how to record. Do not suggest repeating actions that already succeeded.
+      If progress is blocked only because the page lacks target data for the scenario, prefer precondition()
+      over repeated UI attempts.
     `;
     }
     buildVerdictSystemPrompt(type, task) {

package/dist/src/ai/planner.js CHANGED Viewed

@@ -64,6 +64,9 @@ export class Planner extends PlannerBase {
     get sectionOrder() {
         return ConfigParser.getInstance().getConfig().ai?.agents?.researcher?.sections || Object.keys(POSSIBLE_SECTIONS);
     }
+    getDefaultStartUrl(state) {
+        return state.fullUrl || state.url;
+    }
     getSystemMessage(feature) {
         const currentUrl = this.stateManager.getCurrentState()?.url;
         const customPrompt = this.provider.getSystemPromptForAgent('planner', currentUrl);
@@ -138,7 +141,6 @@ export class Planner extends PlannerBase {
         }
         this.freshStart = false;
         setActivity(`${this.emoji} Planning...`, 'action');
-        tag('info').log(`Planning test scenarios for ${state.url}`);
         if (style)
             tag('info').log(`Planning style: ${style}`);
         const tags = ['planner'];
@@ -162,7 +164,8 @@ export class Planner extends PlannerBase {
             if (aiResult.object.scenarios.length === 0 && !this.currentPlan) {
                 throw new Error('No tasks were created successfully');
             }
-            const fromPlanning = aiResult.object.scenarios.map((s) => new Test(s.scenario, s.priority, s.expectedOutcomes, s.startUrl || state.url, s.steps || []));
+            const defaultStartUrl = this.getDefaultStartUrl(state);
+            const fromPlanning = aiResult.object.scenarios.map((s) => new Test(s.scenario, s.priority, s.expectedOutcomes, s.startUrl || defaultStartUrl, s.steps || []));
             return { tests: fromPlanning, planName: aiResult.object.planName };
         });
         const tests = result.tests;
@@ -171,7 +174,8 @@ export class Planner extends PlannerBase {
             const cached = state.url ? getRegisteredPlan(state.url) : null;
             const planName = feature || cached?.plan.title || result.planName || state.url;
             this.currentPlan = new Plan(planName);
-            this.currentPlan.url = state.url;
+            this.currentPlan.url = this.getDefaultStartUrl(state);
+            const defaultStartUrl = this.getDefaultStartUrl(state);
             if (parentPlan)
                 this.currentPlan.parentPlan = parentPlan;
             const allPreviousScenarios = this.getPreviousSessionScenarios();
@@ -182,14 +186,14 @@ export class Planner extends PlannerBase {
                 if (allPreviousScenarios.has(t.scenario.toLowerCase()))
                     continue;
                 t.style = this.lastStyleName;
-                t.startUrl = state.url;
+                t.startUrl = defaultStartUrl;
                 this.currentPlan.addTest(t);
             }
         }
         else {
             tag('step').log(`Expanding plan: "${this.currentPlan.title}"`);
             this.currentPlan.nextIteration();
-            const newTests = this.addNewTests(tests, state.url);
+            const newTests = this.addNewTests(tests, this.getDefaultStartUrl(state));
             if (newTests.length > 0) {
                 const summary = `New scenarios:\n${newTests.map((t) => `+ [${t.priority}] ${t.scenario}`).join('\n')}`;
                 tag('multiline').log(summary);
@@ -292,6 +296,13 @@ export class Planner extends PlannerBase {
       Focus on URL page change or data persistency after page reload.
       If there are subpages (pages with same URL path) plan testing of those subpages as well
       If you plan to test CRUD operations, plan them in correct order: create, read, update.
+      Do not invent specific route names, success messages, validation texts, badge counts, or welcome messages unless they are visible in research, visited pages, or prior observed flows.
+      If exact wording is unknown, describe the expected result generically, for example "an authentication error is shown" or "the user stays on the login page" instead of guessing the literal text.
+      If exact redirect destination is unknown, describe the destination by visible page identity, for example "the dashboard page opens" or "the current workspace home page opens" instead of inventing a URL slug.
+      Only propose scenarios whose prerequisites are evident from page research, visited pages, or API data preparation context.
+      If a scenario needs existing records, recipients, results, notifications, or other target data, propose it only when that data is visible or API preconditions can create it.
+      If the page appears read-only, degraded, demo-limited, maintenance-like, or lacks write controls, prefer read-only scenarios such as opening panels, inspecting visible lists, filtering, searching, or verifying current state.
+      Do not assume hidden data exists just because a control is present.
       DO NOT propose "verification-only" tests that merely open a UI element (modal, dropdown, panel) and check it exists.
       Every test must complete a meaningful action that changes application state or produces a business outcome.
       Opening a modal is NOT a test — performing an action INSIDE the modal IS a test.
@@ -516,10 +527,15 @@ export class Planner extends PlannerBase {
          - Good: "New suite 'My New Suite' appears in the suite list"
          - Good: "Suite appears under Starred filter tab"
          - Good: "Success message 'Suite created' is displayed"
+         - Good when wording is unknown: "An authentication error is displayed"
+         - Good when route is unknown: "The workspace home page is displayed"
          - Bad: "Modal is displayed" (just verifying existence, no business value)
          - Bad: "Dropdown menu is visible" (just verifying existence)
+         - Bad: "Welcome message is displayed" if no welcome message is visible in research
+         - Bad: "Redirected to /dashboard" if no such route was observed
          - Each outcome should be independently verifiable
          - Avoid combining multiple checks into one outcome
+         - Prefer durable user-facing results over fragile micro-signals
          - Expected outcomes describe WHAT TO VERIFY
          FORMATTING RULES:

package/dist/src/ai/rerunner.js CHANGED Viewed

@@ -67,7 +67,7 @@ export class Rerunner extends TaskAgent {
             tag('error').log(`Test file not found: ${absPath}`);
             return { total: 0, passed: 0, failed: 0, healed: 0 };
         }
-        tag('info').log(`Re-running tests from: ${relative(process.cwd(), absPath)}`);
+        tag('step').log(`Re-running tests from: ${relative(process.cwd(), absPath)}`);
         setActivity('🔄 Re-running tests...', 'action');
         this.healedSteps = [];
         this.setupPlugins();

package/dist/src/ai/researcher/deep-analysis.js CHANGED Viewed

@@ -12,7 +12,7 @@ export function WithDeepAnalysis(Base) {
     return class extends Base {
         async performDeepAnalysis(state, result) {
             tag('info').log('Starting deep analysis of expandable elements');
-            await this.navigateTo(state.url);
+            await this.navigateTo(state.fullUrl || state.url);
             let expandables = await this._discoverExpandables(result.text);
             if (expandables.length === 0) {
                 tag('info').log('No expandable elements identified by AI');
@@ -21,7 +21,7 @@ export function WithDeepAnalysis(Base) {
             tag('substep').log(`Identified ${expandables.length} expandable elements`);
             const maxClicks = this.explorer.getConfig().ai?.agents?.researcher?.maxExpandableClicks ?? DEFAULT_MAX_EXPANDABLE_CLICKS;
             if (expandables.length > maxClicks) {
-                expandables = await this._selectExpandables(expandables, state.url, maxClicks);
+                expandables = await this._selectExpandables(expandables, state.fullUrl || state.url, maxClicks);
                 tag('substep').log(`Selected ${expandables.length} expandables to click (max: ${maxClicks})`);
             }
             const elements = expandables
@@ -144,7 +144,15 @@ export function WithDeepAnalysis(Base) {
         `;
                 visionCall = this.provider.processImage(visionPrompt, screenshot.toString('base64'));
             }
-            const [textRes, visionRes] = await Promise.all([textCall, visionCall]);
+            let textRes = null;
+            let visionRes = null;
+            try {
+                [textRes, visionRes] = await Promise.all([textCall, visionCall]);
+            }
+            catch (err) {
+                tag('warning').log(`Expandable discovery failed, skipping deep analysis: ${err instanceof Error ? err.message : err}`);
+                return [];
+            }
             const eidxSet = new Set();
             const parseRefs = (text) => {
                 if (!text)
@@ -204,10 +212,17 @@ export function WithDeepAnalysis(Base) {
         - Respond with comma-separated numbers to keep, e.g.: 1, 3, 5
       `;
             const model = this.provider.getModelForAgent('researcher');
-            const r = await this.provider.chat([{ role: 'user', content: prompt }], model, {
-                agentName: 'researcher',
-                telemetryFunctionId: 'researcher.selectExpandables',
-            });
+            let r;
+            try {
+                r = await this.provider.chat([{ role: 'user', content: prompt }], model, {
+                    agentName: 'researcher',
+                    telemetryFunctionId: 'researcher.selectExpandables',
+                });
+            }
+            catch (err) {
+                tag('warning').log(`Expandable selection failed, using first ${maxClicks}: ${err instanceof Error ? err.message : err}`);
+                return expandables.slice(0, maxClicks);
+            }
             const nums = (r.text || '').match(/\d+/g)?.map(Number) || [];
             const selected = expandables.filter((_, i) => nums.includes(i + 1));
             return selected.length > 0 ? selected.slice(0, maxClicks) : expandables.slice(0, maxClicks);

package/dist/src/ai/researcher.js CHANGED Viewed

@@ -93,7 +93,7 @@ export class Researcher extends ResearcherBase {
             const displayUrl = state.fullUrl || state.url;
             tag('info').log(`Researching ${displayUrl} to understand the context...`);
             setActivity(`${this.emoji} Researching...`, 'action');
-            await this.ensureNavigated(state.url, screenshot && this.provider.hasVision());
+            await this.ensureNavigated(displayUrl, screenshot && this.provider.hasVision());
             await this.hooksRunner.runBeforeHook('researcher', state.url);
             const annotatedElements = await this.explorer.annotateElements();
             debugLog(`Annotated ${annotatedElements.length} interactive elements with eidx`);
@@ -114,11 +114,11 @@ export class Researcher extends ResearcherBase {
             if (!deep && !force) {
                 const similar = await findSimilarResearch(combinedHtml);
                 if (similar) {
-                    tag('info').log('Similar research found, reusing cached result');
+                    tag('substep').log('Similar research found, reusing cached result');
                     if (stateHash)
                         saveResearch(stateHash, similar, combinedHtml);
                     tag('multiline').log(formatResearchSummary(similar));
-                    tag('success').log(`Research complete! ${similar.length} characters (reused)`);
+                    tag('success').log('Research complete (reused)');
                     await this.hooksRunner.runAfterHook('researcher', state.url);
                     return similar;
                 }
@@ -236,7 +236,12 @@ export class Researcher extends ResearcherBase {
                     markSectionAsFocused(result, fallback);
             }
             if (!interrupted() && deep) {
-                await this.performDeepAnalysis(state, result);
+                try {
+                    await this.performDeepAnalysis(state, result);
+                }
+                catch (err) {
+                    tag('warning').log(`Deep analysis failed, continuing with best-effort research: ${err instanceof Error ? err.message : err}`);
+                }
             }
             if (!interrupted() && data) {
                 const extractedData = await this.extractData(state);
@@ -257,7 +262,7 @@ export class Researcher extends ResearcherBase {
                     this.experienceTracker.updateSummary(this.actionResult, summaryLine);
             }
             tag('multiline').log(formatResearchSummary(result.text, { visionUsed: this.hasScreenshotToAnalyze }));
-            tag('success').log(`Research complete! ${result.text.length} characters`);
+            tag('success').log('Research complete');
             if (researchFile)
                 tag('substep').log(`Research file saved to: ${researchFile}`);
             if (this.actionResult?.screenshotFile) {

package/dist/src/ai/session-analyst.js CHANGED Viewed

@@ -105,12 +105,36 @@ export class SessionAnalyst {
             .slice(-30)
             .map((entry) => `  - [${entry.type}] ${entry.content}`)
             .join('\n');
+        const checked = test.getCheckedExpectations().join(' | ') || '(none)';
+        const remaining = test.getRemainingExpectations().join(' | ') || '(none)';
+        const notes = test
+            .getPrintableNotes()
+            .slice(-12)
+            .map((note) => `  - ${note}`)
+            .join('\n');
+        const visitedUrls = test.getVisitedUrls({ localOnly: true }).join(' | ') || '(none)';
+        const verification = test.verification
+            ? dedent `
+          verification_status: ${test.verification.status || 'unknown'}
+          verification_message: ${test.verification.message || '(none)'}
+          verification_url: ${test.verification.url || '(none)'}
+          verification_page: ${test.verification.pageLabel || '(none)'}
+          verification_details:
+          ${(test.verification.details.length > 0 ? test.verification.details : ['(none)']).map((detail) => `  - ${detail}`).join('\n')}
+        `
+            : 'verification_status: none';
         return dedent `
       <test ref="#${ref}">
       url: ${test.startUrl || '/'}
       scenario: ${test.scenario}
       result: ${test.result || 'unknown'}
       expected: ${test.expected.join(' | ') || '(none)'}
+      checked_expectations: ${checked}
+      remaining_expectations: ${remaining}
+      visited_urls: ${visitedUrls}
+      ${verification}
+      notes:
+      ${notes || '  - (none)'}
       log:
       ${log}
       </test>

package/dist/src/ai/tester.js CHANGED Viewed

@@ -92,7 +92,6 @@ export class Tester extends TaskAgent {
         const state = this.explorer.getStateManager().getCurrentState();
         if (!state)
             throw new Error('No state found');
-        tag('info').log(`Testing scenario: ${task.scenario}`);
         setActivity(`🧪 Testing: ${task.scenario}`, 'action');
         this.previousUrl = null;
         this.previousStateHash = null;
@@ -595,7 +594,6 @@ export class Tester extends TaskAgent {
         if (!task.hasFinished) {
             task.finish(TestResult.FAILED);
         }
-        tag('info').log(`Finished: ${task.scenario}`);
         if (task.isSuccessful) {
             tag('success').log(`Successful test: ${task.scenario}`);
         }
@@ -792,7 +790,9 @@ export class Tester extends TaskAgent {
                     if (this.getCurrentState().isInsideIframe) {
                         await this.explorer.switchToMainFrame();
                     }
-                    if (this.explorer.getStateManager().getCurrentState()?.url === resetUrl) {
+                    const currentState = this.explorer.getStateManager().getCurrentState();
+                    const currentUrl = currentState?.fullUrl || currentState?.url;
+                    if (currentUrl === resetUrl) {
                         return {
                             success: false,
                             message: 'Reset failed - already on initial page!',

package/dist/src/ai/tools.js CHANGED Viewed

@@ -731,11 +731,12 @@ export function createAgentTools({ explorer, researcher, navigator, experienceTr
             }),
             execute: async ({ reason }) => {
                 const stateManager = explorer.getStateManager();
-                const currentUrl = stateManager.getCurrentState()?.url;
+                const currentState = stateManager.getCurrentState();
+                const currentUrl = currentState?.fullUrl || currentState?.url;
                 const history = stateManager.getStateHistory();
                 let targetUrl = null;
                 for (let i = history.length - 1; i >= 0; i--) {
-                    const url = history[i].toState.url;
+                    const url = history[i].toState.fullUrl || history[i].toState.url;
                     if (url !== currentUrl) {
                         targetUrl = url;
                         break;

package/dist/src/commands/explore-command.js CHANGED Viewed

@@ -34,6 +34,10 @@ export class ExploreCommand extends BaseCommand {
     failedSubPages = new Set();
     oldTestRefs = new Set();
     priorityFilter;
+    getCurrentPageUrl() {
+        const state = this.explorBot.getExplorer().getStateManager().getCurrentState();
+        return state?.fullUrl || state?.url;
+    }
     async execute(args) {
         const { opts, args: remaining } = this.parseArgs(args);
         if (opts.maxTests) {
@@ -49,7 +53,7 @@ export class ExploreCommand extends BaseCommand {
             tag('info').log('Dry-run mode: planner runs to discover new tests; test execution is skipped');
         Stats.mode ??= 'explore';
         Stats.focus ??= feature;
-        const mainUrl = this.explorBot.getExplorer().getStateManager().getCurrentState()?.url;
+        const mainUrl = this.getCurrentPageUrl();
         if (cfg.enabled) {
             await this.runReuseMode(mainUrl, feature, cfg);
         }

package/dist/src/components/LogPane.js CHANGED Viewed

@@ -10,6 +10,15 @@ const LogPane = React.memo(({ verboseMode }) => {
     const [logs, setLogs] = useState([]);
     const pendingLogsRef = React.useRef([]);
     const flushTimeoutRef = React.useRef(null);
+    const MAX_MULTILINE_LINES = 16;
+    const MAX_STEP_LINES = 8;
+    const MAX_SUBSTEP_LINES = 6;
+    const formatCollapsedContent = useCallback((lines, collapsedCount, label) => {
+        if (collapsedCount <= 0) {
+            return lines.join('\n');
+        }
+        return [`... ${collapsedCount} earlier ${label}`, ...lines].join('\n');
+    }, []);
     const flushLogs = useCallback(() => {
         if (pendingLogsRef.current.length === 0)
             return;
@@ -27,11 +36,33 @@ const LogPane = React.memo(({ verboseMode }) => {
                 if (lastLog.type === logEntry.type && lastLog.content === logEntry.content && Math.abs((lastLog.timestamp?.getTime() || 0) - (logEntry.timestamp?.getTime() || 0)) < 1000) {
                     continue;
                 }
+                if ((logEntry.type === 'step' || logEntry.type === 'substep') && lastLog.type === logEntry.type && Math.abs((lastLog.timestamp?.getTime() || 0) - (logEntry.timestamp?.getTime() || 0)) < 1500) {
+                    const currentLines = String(logEntry.content)
+                        .split('\n')
+                        .filter((line) => line.length > 0);
+                    const previousLines = String(lastLog.content)
+                        .split('\n')
+                        .filter((line) => line.length > 0);
+                    const visiblePreviousLines = lastLog.collapsedCount ? previousLines.slice(1) : previousLines;
+                    const maxLines = logEntry.type === 'step' ? MAX_STEP_LINES : MAX_SUBSTEP_LINES;
+                    const mergedLines = [...visiblePreviousLines, ...currentLines];
+                    const overflow = Math.max(0, mergedLines.length - maxLines);
+                    const collapsedCount = (lastLog.collapsedCount || 0) + overflow;
+                    const visibleLines = mergedLines.slice(-maxLines);
+                    const label = logEntry.type === 'step' ? 'steps' : 'details';
+                    result[result.length - 1] = {
+                        ...lastLog,
+                        content: formatCollapsedContent(visibleLines, collapsedCount, label),
+                        timestamp: logEntry.timestamp,
+                        collapsedCount,
+                    };
+                    continue;
+                }
                 result.push(logEntry);
             }
             return result;
         });
-    }, []);
+    }, [formatCollapsedContent]);
     const addLog = useCallback((logEntry) => {
         pendingLogsRef.current.push(logEntry);
         if (!flushTimeoutRef.current) {
@@ -85,10 +116,9 @@ const LogPane = React.memo(({ verboseMode }) => {
             const cleaned = stripAnsi(dedent(log.content));
             const parsed = parseMarkdownToTerminal(cleaned);
             const lines = parsed.split('\n');
-            const maxLines = 30;
-            const truncated = lines.length > maxLines ? `${lines.slice(0, maxLines).join('\n')}\n... (${lines.length - maxLines} more lines)` : cleaned;
+            const truncated = lines.length > MAX_MULTILINE_LINES ? `${lines.slice(0, MAX_MULTILINE_LINES).join('\n')}\n... (${lines.length - MAX_MULTILINE_LINES} more lines)` : parsed;
             return (React.createElement(Box, { key: index, borderStyle: "classic", borderLeft: false, borderRight: false, marginY: 1, padding: 1, borderColor: "dim", overflow: "hidden" },
-                React.createElement(Text, { color: "gray", dimColor: true }, parsed)));
+                React.createElement(Text, { color: "gray", dimColor: true }, truncated)));
         }
         if (log.type === 'html') {
             // Convert HTML to markdown, then render as multiline

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "explorbot",
-  "version": "0.1.18",
+  "version": "0.1.20",
   "description": "CLI app built with React Ink, CodeceptJS, and Playwright",
   "license": "Elastic-2.0",
   "type": "module",

package/src/action.ts CHANGED Viewed

@@ -2,7 +2,6 @@ import fs from 'node:fs';
 import { join } from 'node:path';
 import { faker } from '@faker-js/faker';
 import { context, trace } from '@opentelemetry/api';
-import { highlight } from 'cli-highlight';
 import { container, recorder } from 'codeceptjs';
 import * as codeceptjs from 'codeceptjs';
 import { hopeThat, retryTo, tryTo, within } from 'codeceptjs/lib/effects';
@@ -21,7 +20,7 @@ import type { PlaywrightRecorder } from './playwright-recorder.ts';
 import type { StateManager } from './state-manager.js';
 import { extractCodeBlocks } from './utils/code-extractor.js';
 import { htmlCombinedSnapshot, minifyHtml } from './utils/html.js';
-import { createDebug, log, setStepSpanParent, tag } from './utils/logger.js';
+import { createDebug, setStepSpanParent, tag } from './utils/logger.js';
 import { safeFilename } from './utils/strings.ts';
 import { throttle } from './utils/throttle.ts';
@@ -296,7 +295,13 @@ class Action {
   async expect(codeOrFunction: string | ((I: CodeceptJS.I) => void)): Promise<Action> {
     const codeString = typeof codeOrFunction === 'string' ? codeOrFunction : codeOrFunction.toString();
     this.expectation = codeString.toString();
-    log('Expecting', highlight(codeString, { language: 'javascript' }));
+    const expectationPreview = sanitizeCodeBlock(codeString)
+      .split('\n')
+      .map((line) => line.trim())
+      .filter(Boolean)
+      .slice(0, 2)
+      .join(' ');
+    tag('step').log(`Expecting: ${expectationPreview || 'assertion'}`);
     try {
       debugLog('Executing expectation:', codeString);

package/src/ai/driller.ts CHANGED Viewed

@@ -168,7 +168,7 @@ export class Driller extends TaskAgent implements Agent {
     this.allResults = [];
     return Observability.run(`driller: ${currentState.url}`, { tags: ['driller'], sessionId: sessionName }, async () => {
-      tag('info').log(`Driller starting on ${currentState.url}`);
+      tag('step').log(`Drilling page: ${currentState.url}`);
       await this.hooksRunner.runBeforeHook('driller', currentState.url);
       const originalState = await this.captureAnnotatedState();

package/src/ai/navigator.ts CHANGED Viewed

@@ -80,8 +80,48 @@ class Navigator implements Agent {
     this.hooksRunner = new HooksRunner(explorer, explorer.getConfig());
   }
+  private getBaseOrigin(): string | null {
+    const baseUrl = this.explorer.getConfig().playwright.url;
+    try {
+      return new URL(baseUrl).origin;
+    } catch {
+      return null;
+    }
+  }
+  private getComparableCurrentUrl(stateManager: any, expectedUrl: string): string {
+    const currentState = stateManager.getCurrentState();
+    if (!currentState) return '';
+    const current = /^https?:\/\//i.test(expectedUrl) ? currentState.fullUrl || currentState.url || '' : currentState.url || '';
+    return current;
+  }
+  private isSameExpectedOrigin(expectedUrl: string, stateManager: any): boolean {
+    const currentState = stateManager.getCurrentState();
+    if (!currentState) return false;
+    const currentFullUrl = currentState.fullUrl || currentState.url || '';
+    if (!currentFullUrl) return false;
+    try {
+      const currentOrigin = new URL(currentFullUrl).origin;
+      if (/^https?:\/\//i.test(expectedUrl)) {
+        return currentOrigin === new URL(expectedUrl).origin;
+      }
+      const baseOrigin = this.getBaseOrigin();
+      if (!baseOrigin) return true;
+      return currentOrigin === baseOrigin;
+    } catch {
+      return !/^https?:\/\//i.test(expectedUrl);
+    }
+  }
   private isOnExpectedPage(expectedUrl: string, stateManager: any): boolean {
-    const currentUrl = stateManager.getCurrentState()?.url || '';
+    if (!this.isSameExpectedOrigin(expectedUrl, stateManager)) {
+      return false;
+    }
+    const currentUrl = this.getComparableCurrentUrl(stateManager, expectedUrl);
     return normalizeUrl(currentUrl) === normalizeUrl(expectedUrl);
   }
@@ -282,7 +322,8 @@ class Navigator implements Agent {
             }
           }
           const freshState = await action.capturePageState();
-          const urlMatches = normalizeUrl(freshState.url || '') === normalizeUrl(expectedUrl);
+          const currentUrl = /^https?:\/\//i.test(expectedUrl) ? freshState.fullUrl || freshState.url || '' : freshState.url || '';
+          const urlMatches = this.isSameExpectedOrigin(expectedUrl, action.stateManager) && normalizeUrl(currentUrl) === normalizeUrl(expectedUrl);
           const stateChanged = freshState.getStateHash() !== actionResult.getStateHash();
           resolved = urlMatches && stateChanged;

package/src/ai/pilot.ts CHANGED Viewed

@@ -313,6 +313,9 @@ export class Pilot implements Agent {
       overrides the others — weigh them together. Tester's record() notes are the LEAST reliable; always
       cross-check against actual actions and state. Visual screenshot analysis is strong for UI state
       (active tabs, visible counts, colors).
+      If the final page clearly shows an equivalent success state in a different UI form, do not fail only
+      because one narrow assertion targeted a specific badge, count, toast, or wording that the product
+      represents differently.
       SCENARIO TITLE defines what must happen. Action verbs require persisted evidence:
       - "Create X" → X must exist (visible, redirected to its page, or success message). Opening a form is NOT enough.
@@ -355,6 +358,8 @@ export class Pilot implements Agent {
       GUIDANCE (required for "continue"): a specific next action on the current page — which tool, what
       to verify, how to record. Do not suggest repeating actions that already succeeded.
+      If progress is blocked only because the page lacks target data for the scenario, prefer precondition()
+      over repeated UI attempts.
     `;
   }

package/src/ai/planner.ts CHANGED Viewed

@@ -80,6 +80,10 @@ export class Planner extends PlannerBase implements Agent {
     return ConfigParser.getInstance().getConfig().ai?.agents?.researcher?.sections || Object.keys(POSSIBLE_SECTIONS);
   }
+  private getDefaultStartUrl(state: { url: string; fullUrl?: string }): string {
+    return state.fullUrl || state.url;
+  }
   getSystemMessage(feature?: string): string {
     const currentUrl = this.stateManager.getCurrentState()?.url;
     const customPrompt = this.provider.getSystemPromptForAgent('planner', currentUrl);
@@ -160,7 +164,6 @@ export class Planner extends PlannerBase implements Agent {
     this.freshStart = false;
     setActivity(`${this.emoji} Planning...`, 'action');
-    tag('info').log(`Planning test scenarios for ${state.url}`);
     if (style) tag('info').log(`Planning style: ${style}`);
     const tags = ['planner'];
@@ -188,7 +191,8 @@ export class Planner extends PlannerBase implements Agent {
         throw new Error('No tasks were created successfully');
       }
-      const fromPlanning = aiResult.object.scenarios.map((s: any) => new Test(s.scenario, s.priority, s.expectedOutcomes, s.startUrl || state.url, s.steps || []));
+      const defaultStartUrl = this.getDefaultStartUrl(state);
+      const fromPlanning = aiResult.object.scenarios.map((s: any) => new Test(s.scenario, s.priority, s.expectedOutcomes, s.startUrl || defaultStartUrl, s.steps || []));
       return { tests: fromPlanning, planName: aiResult.object.planName };
     });
@@ -200,7 +204,8 @@ export class Planner extends PlannerBase implements Agent {
       const cached = state.url ? getRegisteredPlan(state.url) : null;
       const planName = feature || cached?.plan.title || result.planName || state.url;
       this.currentPlan = new Plan(planName);
-      this.currentPlan.url = state.url;
+      this.currentPlan.url = this.getDefaultStartUrl(state);
+      const defaultStartUrl = this.getDefaultStartUrl(state);
       if (parentPlan) this.currentPlan.parentPlan = parentPlan;
       const allPreviousScenarios = this.getPreviousSessionScenarios();
       const existingTestScenarios = this.getExistingTestFileScenarios(state.url);
@@ -208,13 +213,13 @@ export class Planner extends PlannerBase implements Agent {
       for (const t of tests) {
         if (allPreviousScenarios.has(t.scenario.toLowerCase())) continue;
         t.style = this.lastStyleName;
-        t.startUrl = state.url;
+        t.startUrl = defaultStartUrl;
         this.currentPlan.addTest(t);
       }
     } else {
       tag('step').log(`Expanding plan: "${this.currentPlan.title}"`);
       this.currentPlan.nextIteration();
-      const newTests = this.addNewTests(tests, state.url);
+      const newTests = this.addNewTests(tests, this.getDefaultStartUrl(state));
       if (newTests.length > 0) {
         const summary = `New scenarios:\n${newTests.map((t) => `+ [${t.priority}] ${t.scenario}`).join('\n')}`;
         tag('multiline').log(summary);
@@ -331,6 +336,13 @@ export class Planner extends PlannerBase implements Agent {
       Focus on URL page change or data persistency after page reload.
       If there are subpages (pages with same URL path) plan testing of those subpages as well
       If you plan to test CRUD operations, plan them in correct order: create, read, update.
+      Do not invent specific route names, success messages, validation texts, badge counts, or welcome messages unless they are visible in research, visited pages, or prior observed flows.
+      If exact wording is unknown, describe the expected result generically, for example "an authentication error is shown" or "the user stays on the login page" instead of guessing the literal text.
+      If exact redirect destination is unknown, describe the destination by visible page identity, for example "the dashboard page opens" or "the current workspace home page opens" instead of inventing a URL slug.
+      Only propose scenarios whose prerequisites are evident from page research, visited pages, or API data preparation context.
+      If a scenario needs existing records, recipients, results, notifications, or other target data, propose it only when that data is visible or API preconditions can create it.
+      If the page appears read-only, degraded, demo-limited, maintenance-like, or lacks write controls, prefer read-only scenarios such as opening panels, inspecting visible lists, filtering, searching, or verifying current state.
+      Do not assume hidden data exists just because a control is present.
       DO NOT propose "verification-only" tests that merely open a UI element (modal, dropdown, panel) and check it exists.
       Every test must complete a meaningful action that changes application state or produces a business outcome.
       Opening a modal is NOT a test — performing an action INSIDE the modal IS a test.
@@ -566,10 +578,15 @@ export class Planner extends PlannerBase implements Agent {
          - Good: "New suite 'My New Suite' appears in the suite list"
          - Good: "Suite appears under Starred filter tab"
          - Good: "Success message 'Suite created' is displayed"
+         - Good when wording is unknown: "An authentication error is displayed"
+         - Good when route is unknown: "The workspace home page is displayed"
          - Bad: "Modal is displayed" (just verifying existence, no business value)
          - Bad: "Dropdown menu is visible" (just verifying existence)
+         - Bad: "Welcome message is displayed" if no welcome message is visible in research
+         - Bad: "Redirected to /dashboard" if no such route was observed
          - Each outcome should be independently verifiable
          - Avoid combining multiple checks into one outcome
+         - Prefer durable user-facing results over fragile micro-signals
          - Expected outcomes describe WHAT TO VERIFY
          FORMATTING RULES:

package/src/ai/rerunner.ts CHANGED Viewed

@@ -87,7 +87,7 @@ export class Rerunner extends TaskAgent implements Agent {
       return { total: 0, passed: 0, failed: 0, healed: 0 };
     }
-    tag('info').log(`Re-running tests from: ${relative(process.cwd(), absPath)}`);
+    tag('step').log(`Re-running tests from: ${relative(process.cwd(), absPath)}`);
     setActivity('🔄 Re-running tests...', 'action');
     this.healedSteps = [];

package/src/ai/researcher/deep-analysis.ts CHANGED Viewed

@@ -24,7 +24,7 @@ export function WithDeepAnalysis<T extends Constructor>(Base: T) {
     async performDeepAnalysis(state: WebPageState, result: ResearchResult): Promise<void> {
       tag('info').log('Starting deep analysis of expandable elements');
-      await (this as any).navigateTo(state.url);
+      await (this as any).navigateTo(state.fullUrl || state.url);
       let expandables = await this._discoverExpandables(result.text);
       if (expandables.length === 0) {
@@ -35,7 +35,7 @@ export function WithDeepAnalysis<T extends Constructor>(Base: T) {
       const maxClicks = (this.explorer.getConfig().ai?.agents?.researcher as any)?.maxExpandableClicks ?? DEFAULT_MAX_EXPANDABLE_CLICKS;
       if (expandables.length > maxClicks) {
-        expandables = await this._selectExpandables(expandables, state.url, maxClicks);
+        expandables = await this._selectExpandables(expandables, state.fullUrl || state.url, maxClicks);
         tag('substep').log(`Selected ${expandables.length} expandables to click (max: ${maxClicks})`);
       }
@@ -177,7 +177,14 @@ export function WithDeepAnalysis<T extends Constructor>(Base: T) {
         visionCall = this.provider.processImage(visionPrompt, screenshot.toString('base64'));
       }
-      const [textRes, visionRes] = await Promise.all([textCall, visionCall]);
+      let textRes: { text?: string } | null = null;
+      let visionRes: { text?: string } | null = null;
+      try {
+        [textRes, visionRes] = await Promise.all([textCall, visionCall]);
+      } catch (err) {
+        tag('warning').log(`Expandable discovery failed, skipping deep analysis: ${err instanceof Error ? err.message : err}`);
+        return [];
+      }
       const eidxSet = new Set<string>();
       const parseRefs = (text: string | undefined) => {
@@ -244,10 +251,16 @@ export function WithDeepAnalysis<T extends Constructor>(Base: T) {
       `;
       const model = this.provider.getModelForAgent('researcher');
-      const r = await this.provider.chat([{ role: 'user', content: prompt }], model, {
-        agentName: 'researcher',
-        telemetryFunctionId: 'researcher.selectExpandables',
-      });
+      let r: { text?: string };
+      try {
+        r = await this.provider.chat([{ role: 'user', content: prompt }], model, {
+          agentName: 'researcher',
+          telemetryFunctionId: 'researcher.selectExpandables',
+        });
+      } catch (err) {
+        tag('warning').log(`Expandable selection failed, using first ${maxClicks}: ${err instanceof Error ? err.message : err}`);
+        return expandables.slice(0, maxClicks);
+      }
       const nums = (r.text || '').match(/\d+/g)?.map(Number) || [];
       const selected = expandables.filter((_, i) => nums.includes(i + 1));

package/src/ai/researcher.ts CHANGED Viewed

@@ -125,7 +125,7 @@ export class Researcher extends ResearcherBase implements Agent {
       tag('info').log(`Researching ${displayUrl} to understand the context...`);
       setActivity(`${this.emoji} Researching...`, 'action');
-      await this.ensureNavigated(state.url, screenshot && this.provider.hasVision());
+      await this.ensureNavigated(displayUrl, screenshot && this.provider.hasVision());
       await this.hooksRunner.runBeforeHook('researcher', state.url);
       const annotatedElements = await this.explorer.annotateElements();
@@ -151,10 +151,10 @@ export class Researcher extends ResearcherBase implements Agent {
       if (!deep && !force) {
         const similar = await findSimilarResearch(combinedHtml);
         if (similar) {
-          tag('info').log('Similar research found, reusing cached result');
+          tag('substep').log('Similar research found, reusing cached result');
           if (stateHash) saveResearch(stateHash, similar, combinedHtml);
           tag('multiline').log(formatResearchSummary(similar));
-          tag('success').log(`Research complete! ${similar.length} characters (reused)`);
+          tag('success').log('Research complete (reused)');
           await this.hooksRunner.runAfterHook('researcher', state.url);
           return similar;
         }
@@ -285,7 +285,11 @@ export class Researcher extends ResearcherBase implements Agent {
       }
       if (!interrupted() && deep) {
-        await this.performDeepAnalysis(state, result);
+        try {
+          await this.performDeepAnalysis(state, result);
+        } catch (err) {
+          tag('warning').log(`Deep analysis failed, continuing with best-effort research: ${err instanceof Error ? err.message : err}`);
+        }
       }
       if (!interrupted() && data) {
@@ -311,7 +315,7 @@ export class Researcher extends ResearcherBase implements Agent {
       }
       tag('multiline').log(formatResearchSummary(result.text, { visionUsed: this.hasScreenshotToAnalyze }));
-      tag('success').log(`Research complete! ${result.text.length} characters`);
+      tag('success').log('Research complete');
       if (researchFile) tag('substep').log(`Research file saved to: ${researchFile}`);
       if (this.actionResult?.screenshotFile) {
         const screenshotPath = outputPath('states', this.actionResult.screenshotFile);

package/src/ai/session-analyst.ts CHANGED Viewed

@@ -120,6 +120,24 @@ export class SessionAnalyst implements Agent {
       .slice(-30)
       .map((entry) => `  - [${entry.type}] ${entry.content}`)
       .join('\n');
+    const checked = test.getCheckedExpectations().join(' | ') || '(none)';
+    const remaining = test.getRemainingExpectations().join(' | ') || '(none)';
+    const notes = test
+      .getPrintableNotes()
+      .slice(-12)
+      .map((note) => `  - ${note}`)
+      .join('\n');
+    const visitedUrls = test.getVisitedUrls({ localOnly: true }).join(' | ') || '(none)';
+    const verification = test.verification
+      ? dedent`
+          verification_status: ${test.verification.status || 'unknown'}
+          verification_message: ${test.verification.message || '(none)'}
+          verification_url: ${test.verification.url || '(none)'}
+          verification_page: ${test.verification.pageLabel || '(none)'}
+          verification_details:
+          ${(test.verification.details.length > 0 ? test.verification.details : ['(none)']).map((detail) => `  - ${detail}`).join('\n')}
+        `
+      : 'verification_status: none';
     return dedent`
       <test ref="#${ref}">
@@ -127,6 +145,12 @@ export class SessionAnalyst implements Agent {
       scenario: ${test.scenario}
       result: ${test.result || 'unknown'}
       expected: ${test.expected.join(' | ') || '(none)'}
+      checked_expectations: ${checked}
+      remaining_expectations: ${remaining}
+      visited_urls: ${visitedUrls}
+      ${verification}
+      notes:
+      ${notes || '  - (none)'}
       log:
       ${log}
       </test>

package/src/ai/tester.ts CHANGED Viewed

@@ -118,7 +118,6 @@ export class Tester extends TaskAgent implements Agent {
     const state = this.explorer.getStateManager().getCurrentState();
     if (!state) throw new Error('No state found');
-    tag('info').log(`Testing scenario: ${task.scenario}`);
     setActivity(`🧪 Testing: ${task.scenario}`, 'action');
     this.previousUrl = null;
@@ -678,7 +677,6 @@ export class Tester extends TaskAgent implements Agent {
     if (!task.hasFinished) {
       task.finish(TestResult.FAILED);
     }
-    tag('info').log(`Finished: ${task.scenario}`);
     if (task.isSuccessful) {
       tag('success').log(`Successful test: ${task.scenario}`);
@@ -882,7 +880,9 @@ export class Tester extends TaskAgent implements Agent {
             await this.explorer.switchToMainFrame();
           }
-          if (this.explorer.getStateManager().getCurrentState()?.url === resetUrl!) {
+          const currentState = this.explorer.getStateManager().getCurrentState();
+          const currentUrl = currentState?.fullUrl || currentState?.url;
+          if (currentUrl === resetUrl!) {
             return {
               success: false,
               message: 'Reset failed - already on initial page!',

package/src/ai/tools.ts CHANGED Viewed

@@ -854,12 +854,13 @@ export function createAgentTools({
       }),
       execute: async ({ reason }) => {
         const stateManager = explorer.getStateManager();
-        const currentUrl = stateManager.getCurrentState()?.url;
+        const currentState = stateManager.getCurrentState();
+        const currentUrl = currentState?.fullUrl || currentState?.url;
         const history = stateManager.getStateHistory();
         let targetUrl: string | null = null;
         for (let i = history.length - 1; i >= 0; i--) {
-          const url = history[i].toState.url;
+          const url = history[i].toState.fullUrl || history[i].toState.url;
           if (url !== currentUrl) {
             targetUrl = url;
             break;

package/src/commands/explore-command.ts CHANGED Viewed

@@ -38,6 +38,11 @@ export class ExploreCommand extends BaseCommand {
   private oldTestRefs = new Set<Test>();
   private priorityFilter?: Set<string>;
+  private getCurrentPageUrl(): string | undefined {
+    const state = this.explorBot.getExplorer().getStateManager().getCurrentState();
+    return state?.fullUrl || state?.url;
+  }
   async execute(args: string): Promise<void> {
     const { opts, args: remaining } = this.parseArgs(args);
     if (opts.maxTests) {
@@ -51,7 +56,7 @@ export class ExploreCommand extends BaseCommand {
     if (this.dryRun) tag('info').log('Dry-run mode: planner runs to discover new tests; test execution is skipped');
     Stats.mode ??= 'explore';
     Stats.focus ??= feature;
-    const mainUrl = this.explorBot.getExplorer().getStateManager().getCurrentState()?.url;
+    const mainUrl = this.getCurrentPageUrl();
     if (cfg.enabled) {
       await this.runReuseMode(mainUrl, feature, cfg);

package/src/components/LogPane.tsx CHANGED Viewed

@@ -7,21 +7,32 @@ import { parseMarkdownToTerminal } from '../utils/markdown-terminal.js';
 import { Box, Text } from 'ink';
 import type { LogType, TaggedLogEntry } from '../utils/logger.js';
-import { isDebugMode, registerLogPane, setVerboseMode, unregisterLogPane } from '../utils/logger.js';
+import { isDebugMode, registerLogPane, unregisterLogPane } from '../utils/logger.js';
 // marked.use(new markedTerminal());
-type LogEntry = TaggedLogEntry;
+type LogEntry = TaggedLogEntry & { collapsedCount?: number };
 interface LogPaneProps {
   verboseMode: boolean;
 }
 const LogPane: React.FC<LogPaneProps> = React.memo(({ verboseMode }) => {
-  const [logs, setLogs] = useState<TaggedLogEntry[]>([]);
-  const pendingLogsRef = React.useRef<TaggedLogEntry[]>([]);
+  const [logs, setLogs] = useState<LogEntry[]>([]);
+  const pendingLogsRef = React.useRef<LogEntry[]>([]);
   const flushTimeoutRef = React.useRef<ReturnType<typeof setTimeout> | null>(null);
+  const MAX_MULTILINE_LINES = 16;
+  const MAX_STEP_LINES = 8;
+  const MAX_SUBSTEP_LINES = 6;
+  const formatCollapsedContent = useCallback((lines: string[], collapsedCount: number, label: string) => {
+    if (collapsedCount <= 0) {
+      return lines.join('\n');
+    }
+    return [`... ${collapsedCount} earlier ${label}`, ...lines].join('\n');
+  }, []);
   const flushLogs = useCallback(() => {
     if (pendingLogsRef.current.length === 0) return;
@@ -29,7 +40,7 @@ const LogPane: React.FC<LogPaneProps> = React.memo(({ verboseMode }) => {
     pendingLogsRef.current = [];
     flushTimeoutRef.current = null;
-    setLogs((prevLogs: TaggedLogEntry[]) => {
+    setLogs((prevLogs: LogEntry[]) => {
       const result = [...prevLogs];
       for (const logEntry of newLogs) {
@@ -43,12 +54,35 @@ const LogPane: React.FC<LogPaneProps> = React.memo(({ verboseMode }) => {
           continue;
         }
+        if ((logEntry.type === 'step' || logEntry.type === 'substep') && lastLog.type === logEntry.type && Math.abs((lastLog.timestamp?.getTime() || 0) - (logEntry.timestamp?.getTime() || 0)) < 1500) {
+          const currentLines = String(logEntry.content)
+            .split('\n')
+            .filter((line) => line.length > 0);
+          const previousLines = String(lastLog.content)
+            .split('\n')
+            .filter((line) => line.length > 0);
+          const visiblePreviousLines = lastLog.collapsedCount ? previousLines.slice(1) : previousLines;
+          const maxLines = logEntry.type === 'step' ? MAX_STEP_LINES : MAX_SUBSTEP_LINES;
+          const mergedLines = [...visiblePreviousLines, ...currentLines];
+          const overflow = Math.max(0, mergedLines.length - maxLines);
+          const collapsedCount = (lastLog.collapsedCount || 0) + overflow;
+          const visibleLines = mergedLines.slice(-maxLines);
+          const label = logEntry.type === 'step' ? 'steps' : 'details';
+          result[result.length - 1] = {
+            ...lastLog,
+            content: formatCollapsedContent(visibleLines, collapsedCount, label),
+            timestamp: logEntry.timestamp,
+            collapsedCount,
+          };
+          continue;
+        }
         result.push(logEntry);
       }
       return result;
     });
-  }, []);
+  }, [formatCollapsedContent]);
   const addLog = useCallback(
     (logEntry: TaggedLogEntry) => {
@@ -112,12 +146,11 @@ const LogPane: React.FC<LogPaneProps> = React.memo(({ verboseMode }) => {
       const cleaned = stripAnsi(dedent(log.content));
       const parsed = parseMarkdownToTerminal(cleaned);
       const lines = parsed.split('\n');
-      const maxLines = 30;
-      const truncated = lines.length > maxLines ? `${lines.slice(0, maxLines).join('\n')}\n... (${lines.length - maxLines} more lines)` : cleaned;
+      const truncated = lines.length > MAX_MULTILINE_LINES ? `${lines.slice(0, MAX_MULTILINE_LINES).join('\n')}\n... (${lines.length - MAX_MULTILINE_LINES} more lines)` : parsed;
       return (
         <Box key={index} borderStyle="classic" borderLeft={false} borderRight={false} marginY={1} padding={1} borderColor="dim" overflow="hidden">
           <Text color="gray" dimColor>
-            {parsed}
+            {truncated}
           </Text>
         </Box>
       );