npm - nodebench-mcp - Versions diffs - 2.20.2 → 2.21.1 - Mend

nodebench-mcp 2.20.2 → 2.21.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

package/dist/__tests__/tools.test.js +4 -2
package/dist/__tests__/tools.test.js.map +1 -1
package/dist/db.js +109 -0
package/dist/db.js.map +1 -1
package/dist/index.js +3 -3
package/dist/index.js.map +1 -1
package/dist/tools/progressiveDiscoveryTools.js +2 -2
package/dist/tools/progressiveDiscoveryTools.js.map +1 -1
package/dist/tools/toolRegistry.js +101 -0
package/dist/tools/toolRegistry.js.map +1 -1
package/dist/tools/uiUxDiveAdvancedTools.d.ts +20 -0
package/dist/tools/uiUxDiveAdvancedTools.js +883 -0
package/dist/tools/uiUxDiveAdvancedTools.js.map +1 -0
package/dist/toolsetRegistry.js +2 -0
package/dist/toolsetRegistry.js.map +1 -1
package/package.json +1 -1

package/dist/tools/uiUxDiveAdvancedTools.js ADDED Viewed

@@ -0,0 +1,883 @@
+/**
+ * UI/UX Full Dive v2 — Advanced Tools
+ *
+ * Deep interaction testing, screenshot capture, design auditing,
+ * backend context linking, changelog tracking, and walkthrough generation.
+ *
+ * These tools complement the base dive tools (uiUxDiveTools.ts) and work
+ * with the MCP Bridge (playwright-mcp) for browser automation.
+ *
+ * Architecture:
+ * - Agent uses MCP Bridge to drive the browser (navigate, click, type, screenshot)
+ * - These tools provide structured storage and analysis on top of bridge actions
+ * - Screenshots are saved to disk + thumbnail stored in DB for fast retrieval
+ * - Interaction tests define preconditions → steps → expected/actual per step
+ * - Design audits compare computed styles across components for inconsistencies
+ * - Backend links connect UI components to API endpoints, Convex functions, DB tables
+ * - Changelogs track before/after with screenshots when fixes are applied
+ */
+import { mkdirSync, writeFileSync, readFileSync, existsSync, readdirSync } from "node:fs";
+import { join, basename } from "node:path";
+import { homedir } from "node:os";
+import { createConnection } from "node:net";
+import { getDb } from "../db.js";
+function genId(prefix) {
+    return `${prefix}_${Date.now()}_${Math.random().toString(36).slice(2, 11)}`;
+}
+function screenshotDir() {
+    const dir = join(homedir(), ".nodebench", "dive-screenshots");
+    mkdirSync(dir, { recursive: true });
+    return dir;
+}
+/** Try to connect to a TCP port. Resolves true if something is listening. */
+function checkPort(port, host = "127.0.0.1", timeoutMs = 800) {
+    return new Promise((resolve) => {
+        const sock = createConnection({ port, host });
+        const timer = setTimeout(() => { sock.destroy(); resolve(false); }, timeoutMs);
+        sock.on("connect", () => { clearTimeout(timer); sock.destroy(); resolve(true); });
+        sock.on("error", () => { clearTimeout(timer); resolve(false); });
+    });
+}
+/** Recursively find files matching a test, up to maxDepth. */
+function findFiles(dir, test, maxDepth = 4, depth = 0) {
+    if (depth > maxDepth || !existsSync(dir))
+        return [];
+    const results = [];
+    try {
+        for (const entry of readdirSync(dir, { withFileTypes: true })) {
+            if (entry.name.startsWith(".") || entry.name === "node_modules" || entry.name === "dist" || entry.name === ".next")
+                continue;
+            const full = join(dir, entry.name);
+            if (entry.isFile() && test(entry.name))
+                results.push(full);
+            else if (entry.isDirectory())
+                results.push(...findFiles(full, test, maxDepth, depth + 1));
+        }
+    }
+    catch { /* permission errors etc */ }
+    return results;
+}
+/** Extract route paths from source code using common patterns. */
+function extractRoutes(srcDir) {
+    const routes = [];
+    const seen = new Set();
+    // Find files that likely contain route definitions
+    const routeFiles = findFiles(srcDir, (name) => /\.(tsx?|jsx?)$/.test(name) && (/[Rr]out/.test(name) || /[Aa]pp/.test(name) || /[Ll]ayout/.test(name) ||
+        /[Nn]avigation/.test(name) || /[Ss]idebar/.test(name) || /pages/.test(name)));
+    for (const file of routeFiles.slice(0, 30)) {
+        try {
+            const content = readFileSync(file, "utf-8");
+            // Match React Router <Route path="..." patterns
+            const routeMatches = content.matchAll(/path\s*[:=]\s*["'`](\/[^"'`]*?)["'`]/g);
+            for (const m of routeMatches) {
+                const p = m[1];
+                if (!seen.has(p)) {
+                    seen.add(p);
+                    // Try to find component name nearby
+                    const compMatch = content.slice(Math.max(0, m.index - 200), m.index + 200)
+                        .match(/(?:element|component)\s*[:=]\s*[{<]?\s*(\w+)/);
+                    routes.push({ path: p, file: file.replace(/\\/g, "/"), component: compMatch?.[1] });
+                }
+            }
+        }
+        catch { /* unreadable */ }
+    }
+    return routes.sort((a, b) => a.path.localeCompare(b.path));
+}
+export const uiUxDiveAdvancedTools = [
+    // ── 0. Project preflight — analyze project before diving ──────────────
+    {
+        name: "dive_preflight",
+        description: "Analyze a project BEFORE starting a UI dive. Scans the project directory to detect: framework (Vite, Next.js, CRA, etc.), dev scripts, required services (frontend, backend like Convex/Supabase/Firebase), port assignments, whether services are already running, route definitions from source code, and environment requirements. Returns a structured launch plan the agent should follow to get the app running before navigating. This is always Step 0 of a dive.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                projectPath: { type: "string", description: "Absolute path to the project root directory" },
+                checkPorts: {
+                    type: "boolean",
+                    description: "Whether to probe common ports to see what is already running (default: true)",
+                },
+                scanRoutes: {
+                    type: "boolean",
+                    description: "Whether to scan source code for route definitions (default: true)",
+                },
+            },
+            required: ["projectPath"],
+        },
+        handler: async (args) => {
+            const { projectPath, checkPorts: doCheckPorts, scanRoutes: doScanRoutes } = args;
+            if (!existsSync(projectPath)) {
+                return { error: true, message: `Project path not found: ${projectPath}` };
+            }
+            // ── 1. Read package.json ──
+            const pkgPath = join(projectPath, "package.json");
+            let pkg = null;
+            if (existsSync(pkgPath)) {
+                try {
+                    pkg = JSON.parse(readFileSync(pkgPath, "utf-8"));
+                }
+                catch { /* */ }
+            }
+            // ── 2. Detect framework ──
+            const deps = { ...pkg?.dependencies, ...pkg?.devDependencies };
+            const framework = { name: "unknown" };
+            const frameworkChecks = [
+                { name: "next", dep: "next", configs: ["next.config.js", "next.config.ts", "next.config.mjs"] },
+                { name: "vite", dep: "vite", configs: ["vite.config.ts", "vite.config.js", "vite.config.mjs"] },
+                { name: "create-react-app", dep: "react-scripts", configs: [] },
+                { name: "remix", dep: "@remix-run/react", configs: ["remix.config.js"] },
+                { name: "nuxt", dep: "nuxt", configs: ["nuxt.config.ts", "nuxt.config.js"] },
+                { name: "sveltekit", dep: "@sveltejs/kit", configs: ["svelte.config.js"] },
+                { name: "astro", dep: "astro", configs: ["astro.config.mjs", "astro.config.ts"] },
+                { name: "angular", dep: "@angular/core", configs: ["angular.json"] },
+                { name: "gatsby", dep: "gatsby", configs: ["gatsby-config.js", "gatsby-config.ts"] },
+            ];
+            for (const check of frameworkChecks) {
+                if (deps?.[check.dep]) {
+                    framework.name = check.name;
+                    framework.version = deps[check.dep];
+                    for (const cfg of check.configs) {
+                        if (existsSync(join(projectPath, cfg))) {
+                            framework.configFile = cfg;
+                            break;
+                        }
+                    }
+                    break;
+                }
+            }
+            // ── 3. Detect dev scripts ──
+            const scripts = pkg?.scripts ?? {};
+            const devScripts = [];
+            const scriptPriority = ["dev", "dev:frontend", "start", "dev:web", "serve", "develop"];
+            for (const name of Object.keys(scripts)) {
+                let likely = "unknown";
+                const cmd = scripts[name];
+                if (/vite|next dev|react-scripts start|nuxt dev|astro dev/.test(cmd))
+                    likely = "frontend";
+                else if (/convex dev|convex deploy/.test(cmd))
+                    likely = "backend (convex)";
+                else if (/node.*server|express|fastify|hono/.test(cmd))
+                    likely = "backend (api)";
+                else if (/tsc|typescript/.test(cmd))
+                    likely = "build";
+                else if (/vitest|jest|playwright|cypress/.test(cmd))
+                    likely = "test";
+                else if (/lint|eslint|prettier/.test(cmd))
+                    likely = "lint";
+                if (likely === "frontend" || likely.startsWith("backend") || scriptPriority.includes(name)) {
+                    devScripts.push({ name, command: cmd, likely });
+                }
+            }
+            // Sort by priority
+            devScripts.sort((a, b) => {
+                const ai = scriptPriority.indexOf(a.name);
+                const bi = scriptPriority.indexOf(b.name);
+                return (ai === -1 ? 99 : ai) - (bi === -1 ? 99 : bi);
+            });
+            // ── 4. Detect backend services ──
+            const services = [];
+            // Convex
+            if (existsSync(join(projectPath, "convex")) && (deps?.["convex"] || existsSync(join(projectPath, "convex.json")))) {
+                const convexScript = Object.entries(scripts).find(([, cmd]) => cmd.includes("convex dev"));
+                services.push({
+                    name: "Convex",
+                    type: "backend",
+                    detected: "convex/ directory + convex dependency",
+                    startCommand: convexScript ? `npm run ${convexScript[0]}` : "npx convex dev",
+                });
+            }
+            // Supabase
+            if (deps?.["@supabase/supabase-js"] || existsSync(join(projectPath, "supabase"))) {
+                services.push({ name: "Supabase", type: "backend", detected: "supabase dependency or supabase/ directory" });
+            }
+            // Firebase
+            if (deps?.["firebase"] || existsSync(join(projectPath, "firebase.json"))) {
+                services.push({ name: "Firebase", type: "backend", detected: "firebase dependency or firebase.json" });
+            }
+            // Prisma
+            if (deps?.["prisma"] || existsSync(join(projectPath, "prisma"))) {
+                services.push({ name: "Prisma", type: "orm", detected: "prisma dependency or prisma/ directory" });
+            }
+            // Docker
+            if (existsSync(join(projectPath, "docker-compose.yml")) || existsSync(join(projectPath, "docker-compose.yaml"))) {
+                services.push({ name: "Docker Compose", type: "infrastructure", detected: "docker-compose.yml found" });
+            }
+            // ── 5. Detect ports from config ──
+            let frontendPort = 3000; // default
+            if (framework.name === "vite")
+                frontendPort = 5173;
+            else if (framework.name === "next")
+                frontendPort = 3000;
+            else if (framework.name === "create-react-app")
+                frontendPort = 3000;
+            else if (framework.name === "nuxt")
+                frontendPort = 3000;
+            else if (framework.name === "astro")
+                frontendPort = 4321;
+            // Try to read port from vite config
+            if (framework.configFile && existsSync(join(projectPath, framework.configFile))) {
+                try {
+                    const cfgContent = readFileSync(join(projectPath, framework.configFile), "utf-8");
+                    const portMatch = cfgContent.match(/port\s*[:=]\s*(\d+)/);
+                    if (portMatch)
+                        frontendPort = parseInt(portMatch[1], 10);
+                }
+                catch { /* */ }
+            }
+            // ── 6. Check running ports ──
+            const portStatus = {};
+            if (doCheckPorts !== false) {
+                const portsToCheck = [frontendPort, 3000, 3001, 4321, 5173, 5174, 8080, 8788];
+                const uniquePorts = [...new Set(portsToCheck)];
+                await Promise.all(uniquePorts.map(async (p) => {
+                    portStatus[p] = await checkPort(p);
+                }));
+            }
+            const frontendRunning = portStatus[frontendPort] === true;
+            // ── 7. Scan routes ──
+            let routes = [];
+            if (doScanRoutes !== false) {
+                const srcDir = existsSync(join(projectPath, "src")) ? join(projectPath, "src") :
+                    existsSync(join(projectPath, "app")) ? join(projectPath, "app") : projectPath;
+                routes = extractRoutes(srcDir);
+            }
+            // ── 8. Check env files ──
+            const envFiles = [];
+            for (const name of [".env", ".env.local", ".env.development", ".env.development.local"]) {
+                if (existsSync(join(projectPath, name)))
+                    envFiles.push(name);
+            }
+            // ── 9. Build launch plan ──
+            const launchSteps = [];
+            const runningServices = [];
+            if (!frontendRunning) {
+                const devCmd = devScripts.find(s => s.likely === "frontend");
+                launchSteps.push(devCmd
+                    ? `Start frontend: npm run ${devCmd.name}  (runs: ${devCmd.command})`
+                    : `Start frontend: npm run dev  (port ${frontendPort})`);
+            }
+            else {
+                runningServices.push(`Frontend already running on port ${frontendPort}`);
+            }
+            for (const svc of services) {
+                if (svc.type === "backend") {
+                    launchSteps.push(svc.startCommand
+                        ? `Start ${svc.name}: ${svc.startCommand}`
+                        : `Start ${svc.name} (check project docs for startup command)`);
+                }
+            }
+            launchSteps.push(`Verify app is accessible at http://localhost:${frontendPort}`);
+            launchSteps.push("Then: start_ui_dive → navigate routes → discover components → test interactions");
+            return {
+                project: {
+                    name: pkg?.name ?? basename(projectPath),
+                    path: projectPath,
+                    version: pkg?.version,
+                },
+                framework,
+                devScripts,
+                services,
+                ports: {
+                    frontend: frontendPort,
+                    frontendRunning,
+                    status: portStatus,
+                },
+                routes: {
+                    count: routes.length,
+                    discovered: routes.slice(0, 50),
+                },
+                envFiles,
+                launchPlan: {
+                    alreadyRunning: runningServices,
+                    stepsNeeded: launchSteps,
+                    appUrl: `http://localhost:${frontendPort}`,
+                },
+                _hint: frontendRunning
+                    ? `App is running at http://localhost:${frontendPort}. Proceed with start_ui_dive({ appUrl: "http://localhost:${frontendPort}" }) then navigate routes with Playwright.`
+                    : `App is NOT running. Execute the launch plan steps first, then start the dive.`,
+            };
+        },
+    },
+    // ── 1. Save a labeled screenshot ──────────────────────────────────────
+    {
+        name: "dive_save_screenshot",
+        description: "Save a screenshot during a dive session. Pass base64 image data (from bridge's browser_take_screenshot) or a file path. The screenshot is stored on disk and indexed in the DB with labels, route, component, and test references. Returns a screenshot_id you can link to bugs, test steps, design issues, and changelogs. This creates the visual evidence trail for the entire dive.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                label: { type: "string", description: "Human-readable label (e.g. 'Login form - initial state', 'After clicking submit')" },
+                base64Data: { type: "string", description: "Base64-encoded image data (from browser_take_screenshot)" },
+                filePath: { type: "string", description: "Alternative: path to an existing screenshot file" },
+                componentId: { type: "string", description: "Component this screenshot is for (optional)" },
+                route: { type: "string", description: "Current route/URL (optional)" },
+                testId: { type: "string", description: "Interaction test this belongs to (optional)" },
+                stepIndex: { type: "number", description: "Step index within a test (optional)" },
+                metadata: { type: "object", description: "Additional metadata (optional)" },
+            },
+            required: ["sessionId", "label"],
+        },
+        handler: async (args) => {
+            const { sessionId, label, base64Data, filePath, componentId, route, testId, stepIndex, metadata } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT id FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const id = genId("ss");
+            let savedPath = filePath ?? null;
+            // Save base64 data to disk
+            if (base64Data && !filePath) {
+                const dir = screenshotDir();
+                const filename = `${sessionId}_${id}.png`;
+                savedPath = join(dir, filename);
+                try {
+                    const buffer = Buffer.from(base64Data, "base64");
+                    writeFileSync(savedPath, buffer);
+                }
+                catch (e) {
+                    return { error: true, message: `Failed to save screenshot: ${e.message}` };
+                }
+            }
+            // Store a small thumbnail (first 500 chars of base64 for quick preview)
+            const thumbnail = base64Data ? base64Data.slice(0, 500) : null;
+            db.prepare(`INSERT INTO ui_dive_screenshots (id, session_id, component_id, test_id, step_index, label, route, file_path, base64_thumbnail, metadata)
+         VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)`).run(id, sessionId, componentId ?? null, testId ?? null, stepIndex ?? null, label, route ?? null, savedPath, thumbnail, metadata ? JSON.stringify(metadata) : null);
+            return {
+                screenshotId: id,
+                label,
+                filePath: savedPath,
+                componentId: componentId ?? null,
+                route: route ?? null,
+                _hint: `Screenshot saved. Reference it in bugs: tag_ui_bug({ screenshotRef: "${id}" }), test steps, design issues, or changelogs.`,
+            };
+        },
+    },
+    // ── 2. Run a structured interaction test ──────────────────────────────
+    {
+        name: "dive_interaction_test",
+        description: "Define and track a structured interaction test for a component. Provide preconditions and a sequence of test steps (action, target, expected outcome). The agent executes each step via the MCP Bridge (browser_click, browser_type, etc.), takes screenshots, and records actual results here. Each step gets pass/fail status. The test aggregates into an overall result. This creates the detailed walkthrough with preconditions, steps, expected vs actual, and visual evidence at each step.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                componentId: { type: "string", description: "Component being tested" },
+                testName: { type: "string", description: "Test name (e.g. 'Login form submission', 'Dark mode toggle')" },
+                description: { type: "string", description: "What this test validates" },
+                preconditions: {
+                    type: "array",
+                    description: "List of preconditions (e.g. ['User is logged out', 'Browser at /login', 'Dark mode is off'])",
+                    items: { type: "string" },
+                },
+                steps: {
+                    type: "array",
+                    description: "Test steps to execute and track",
+                    items: {
+                        type: "object",
+                        properties: {
+                            action: { type: "string", description: "Action: click, type, navigate, hover, scroll, assert, wait, screenshot" },
+                            target: { type: "string", description: "CSS selector, URL, or description" },
+                            inputValue: { type: "string", description: "Value to type/enter (for type action)" },
+                            expected: { type: "string", description: "Expected outcome (e.g. 'Form submits', 'Error message appears', 'Redirects to /dashboard')" },
+                            screenshotLabel: { type: "string", description: "Label for the screenshot at this step (optional)" },
+                        },
+                        required: ["action", "expected"],
+                    },
+                },
+                metadata: { type: "object", description: "Optional metadata" },
+            },
+            required: ["sessionId", "componentId", "testName", "steps"],
+        },
+        handler: async (args) => {
+            const { sessionId, componentId, testName, description, preconditions, steps, metadata } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT id FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const comp = db.prepare("SELECT id FROM ui_dive_components WHERE id = ?").get(componentId);
+            if (!comp)
+                return { error: true, message: `Component not found: ${componentId}` };
+            const testId = genId("test");
+            db.prepare(`INSERT INTO ui_dive_interaction_tests (id, session_id, component_id, test_name, description, preconditions, steps_total, metadata)
+         VALUES (?, ?, ?, ?, ?, ?, ?, ?)`).run(testId, sessionId, componentId, testName, description ?? null, preconditions ? JSON.stringify(preconditions) : null, steps.length, metadata ? JSON.stringify(metadata) : null);
+            // Create step rows
+            const stepIds = [];
+            for (let i = 0; i < steps.length; i++) {
+                const s = steps[i];
+                const stepId = genId("step");
+                db.prepare(`INSERT INTO ui_dive_test_steps (id, test_id, step_index, action, target, input_value, expected)
+           VALUES (?, ?, ?, ?, ?, ?, ?)`).run(stepId, testId, i, s.action, s.target ?? null, s.inputValue ?? null, s.expected);
+                stepIds.push(stepId);
+            }
+            return {
+                testId,
+                testName,
+                componentId,
+                stepsTotal: steps.length,
+                stepIds,
+                status: "pending",
+                _workflow: [
+                    "For each step, the agent should:",
+                    "1. Execute the action via MCP Bridge (browser_click, browser_type, etc.)",
+                    "2. Take a screenshot via bridge (browser_take_screenshot)",
+                    "3. Save it: dive_save_screenshot({ testId, stepIndex, label, base64Data })",
+                    "4. Record result: dive_record_test_step({ testId, stepIndex, actual, status, screenshotId })",
+                    "5. After all steps: dive completes the test automatically",
+                ],
+                _hint: `Test created with ${steps.length} steps. Execute each step and record results with dive_record_test_step.`,
+            };
+        },
+    },
+    // ── 3. Record a test step result ──────────────────────────────────────
+    {
+        name: "dive_record_test_step",
+        description: "Record the actual result of a test step after executing it via the MCP Bridge. Compare expected vs actual, attach a screenshot, and mark pass/fail. When all steps are recorded, the test is automatically completed with an overall status.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                testId: { type: "string", description: "Interaction test ID from dive_interaction_test" },
+                stepIndex: { type: "number", description: "0-based step index" },
+                actual: { type: "string", description: "What actually happened" },
+                status: {
+                    type: "string",
+                    description: "Step result: passed, failed, skipped, blocked",
+                    enum: ["passed", "failed", "skipped", "blocked"],
+                },
+                screenshotId: { type: "string", description: "Screenshot ID from dive_save_screenshot (optional)" },
+                observation: { type: "string", description: "Additional notes about this step" },
+                durationMs: { type: "number", description: "How long the step took" },
+            },
+            required: ["testId", "stepIndex", "status", "actual"],
+        },
+        handler: async (args) => {
+            const { testId, stepIndex, actual, status, screenshotId, observation, durationMs } = args;
+            const db = getDb();
+            const step = db.prepare("SELECT id, expected FROM ui_dive_test_steps WHERE test_id = ? AND step_index = ?").get(testId, stepIndex);
+            if (!step)
+                return { error: true, message: `Step not found: test=${testId}, index=${stepIndex}` };
+            db.prepare("UPDATE ui_dive_test_steps SET actual = ?, status = ?, screenshot_id = ?, observation = ?, duration_ms = ? WHERE id = ?").run(actual, status, screenshotId ?? null, observation ?? null, durationMs ?? null, step.id);
+            // Check if all steps are done → auto-complete the test
+            const test = db.prepare("SELECT steps_total FROM ui_dive_interaction_tests WHERE id = ?").get(testId);
+            const completed = db.prepare("SELECT COUNT(*) as c FROM ui_dive_test_steps WHERE test_id = ? AND status != 'pending'").get(testId);
+            const passed = db.prepare("SELECT COUNT(*) as c FROM ui_dive_test_steps WHERE test_id = ? AND status = 'passed'").get(testId);
+            const failed = db.prepare("SELECT COUNT(*) as c FROM ui_dive_test_steps WHERE test_id = ? AND status = 'failed'").get(testId);
+            const allDone = completed.c >= test.steps_total;
+            if (allDone) {
+                const overallStatus = failed.c > 0 ? "failed" : "passed";
+                db.prepare("UPDATE ui_dive_interaction_tests SET status = ?, steps_passed = ?, steps_failed = ?, completed_at = datetime('now') WHERE id = ?").run(overallStatus, passed.c, failed.c, testId);
+            }
+            else {
+                db.prepare("UPDATE ui_dive_interaction_tests SET steps_passed = ?, steps_failed = ? WHERE id = ?").run(passed.c, failed.c, testId);
+            }
+            return {
+                stepId: step.id,
+                stepIndex,
+                expected: step.expected,
+                actual,
+                status,
+                match: status === "passed",
+                screenshotId: screenshotId ?? null,
+                testProgress: `${completed.c}/${test.steps_total}`,
+                testComplete: allDone,
+                ...(allDone ? { testStatus: failed.c > 0 ? "failed" : "passed" } : {}),
+                _hint: allDone
+                    ? `Test complete: ${passed.c} passed, ${failed.c} failed.`
+                    : `Step ${stepIndex} recorded. ${test.steps_total - completed.c} steps remaining.`,
+            };
+        },
+    },
+    // ── 4. Tag a design inconsistency ─────────────────────────────────────
+    {
+        name: "dive_design_issue",
+        description: "Tag a design inconsistency found during the dive. Covers visual problems like color mismatches, spacing deviations, font inconsistencies, alignment issues, contrast failures, responsive breakage, missing hover/focus states, and more. Link to a screenshot and the specific element. The agent uses bridge's browser_evaluate to extract computed styles and compare across components.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                componentId: { type: "string", description: "Component with the issue (optional)" },
+                issueType: {
+                    type: "string",
+                    description: "Type: color, spacing, font, alignment, contrast, responsive, hover_state, focus_state, animation, icon, border, shadow, z_index, overflow, consistency",
+                },
+                severity: {
+                    type: "string",
+                    description: "Severity: critical (broken UX), high (obvious visual bug), medium (noticeable deviation), low (minor polish)",
+                    enum: ["critical", "high", "medium", "low"],
+                },
+                title: { type: "string", description: "Short description (e.g. 'Button color mismatch between header and sidebar')" },
+                description: { type: "string", description: "Detailed explanation" },
+                elementSelector: { type: "string", description: "CSS selector of the affected element" },
+                expectedValue: { type: "string", description: "What the design should be (e.g. '#3B82F6', '16px', 'Inter')" },
+                actualValue: { type: "string", description: "What was actually found (e.g. '#2563EB', '12px', 'system-ui')" },
+                screenshotId: { type: "string", description: "Screenshot showing the issue" },
+                route: { type: "string", description: "Route where the issue was found" },
+                metadata: { type: "object", description: "Additional context (e.g. { breakpoint: '768px', theme: 'dark' })" },
+            },
+            required: ["sessionId", "issueType", "title"],
+        },
+        handler: async (args) => {
+            const { sessionId, componentId, issueType, severity, title, description, elementSelector, expectedValue, actualValue, screenshotId, route, metadata } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT id FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const id = genId("design");
+            db.prepare(`INSERT INTO ui_dive_design_issues (id, session_id, component_id, issue_type, severity, title, description, element_selector, expected_value, actual_value, screenshot_id, route, metadata)
+         VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)`).run(id, sessionId, componentId ?? null, issueType, severity ?? "medium", title, description ?? null, elementSelector ?? null, expectedValue ?? null, actualValue ?? null, screenshotId ?? null, route ?? null, metadata ? JSON.stringify(metadata) : null);
+            return {
+                designIssueId: id,
+                issueType,
+                severity: severity ?? "medium",
+                title,
+                expectedValue: expectedValue ?? null,
+                actualValue: actualValue ?? null,
+                _hint: `Design issue tagged. View all issues in the dive report. Fix it, then track with dive_changelog.`,
+            };
+        },
+    },
+    // ── 5. Link UI component to backend context ───────────────────────────
+    {
+        name: "dive_link_backend",
+        description: "Link a UI component to its backend dependencies. Connect components to API endpoints, Convex queries/mutations/actions, database tables, auth guards, WebSocket channels, or external services. This creates the full-stack traceability map — when a UI bug is found, you can immediately see which backend code is involved.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                componentId: { type: "string", description: "Component to link" },
+                links: {
+                    type: "array",
+                    description: "Backend references to link",
+                    items: {
+                        type: "object",
+                        properties: {
+                            linkType: {
+                                type: "string",
+                                description: "Type: convex_query, convex_mutation, convex_action, api_endpoint, db_table, auth_guard, websocket, external_service, env_var, cron_job",
+                            },
+                            path: { type: "string", description: "Path/identifier (e.g. 'api.domains.documents.documents.getSidebar', '/api/users', 'documents' table)" },
+                            description: { type: "string", description: "What this backend dependency does for the component" },
+                            method: { type: "string", description: "HTTP method for API endpoints (GET, POST, etc.)" },
+                        },
+                        required: ["linkType", "path"],
+                    },
+                },
+            },
+            required: ["sessionId", "componentId", "links"],
+        },
+        handler: async (args) => {
+            const { sessionId, componentId, links } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT id FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const comp = db.prepare("SELECT id, name FROM ui_dive_components WHERE id = ?").get(componentId);
+            if (!comp)
+                return { error: true, message: `Component not found: ${componentId}` };
+            const ids = [];
+            for (const link of links) {
+                const id = genId("blink");
+                db.prepare(`INSERT INTO ui_dive_backend_links (id, session_id, component_id, link_type, path, description, method)
+           VALUES (?, ?, ?, ?, ?, ?, ?)`).run(id, sessionId, componentId, link.linkType, link.path, link.description ?? null, link.method ?? null);
+                ids.push(id);
+            }
+            return {
+                componentId,
+                componentName: comp.name,
+                linksCreated: ids.length,
+                links: links.map((l, i) => ({ linkId: ids[i], ...l })),
+                _hint: `${ids.length} backend link(s) created for ${comp.name}. These will appear in the dive report and walkthrough.`,
+            };
+        },
+    },
+    // ── 6. Track a change (changelog entry) ───────────────────────────────
+    {
+        name: "dive_changelog",
+        description: "Record a change made to fix a bug, design issue, or improve a component. Links before/after screenshots to show what changed visually. Optionally references git commits and changed files. When the dive is re-run after fixes, the changelog provides a clear audit trail of what was wrong, what was changed, and how it looks now.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                componentId: { type: "string", description: "Component that was changed (optional)" },
+                changeType: {
+                    type: "string",
+                    description: "Type: bugfix, design_fix, feature, refactor, accessibility, performance, content, responsive",
+                },
+                description: { type: "string", description: "What was changed and why" },
+                beforeScreenshotId: { type: "string", description: "Screenshot before the change (from dive_save_screenshot)" },
+                afterScreenshotId: { type: "string", description: "Screenshot after the change" },
+                filesChanged: {
+                    type: "array",
+                    description: "List of files that were modified",
+                    items: { type: "string" },
+                },
+                gitCommit: { type: "string", description: "Git commit hash (optional)" },
+                metadata: { type: "object", description: "Additional context (e.g. { bugId: '...', designIssueId: '...' })" },
+            },
+            required: ["sessionId", "changeType", "description"],
+        },
+        handler: async (args) => {
+            const { sessionId, componentId, changeType, description, beforeScreenshotId, afterScreenshotId, filesChanged, gitCommit, metadata } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT id FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const id = genId("chg");
+            db.prepare(`INSERT INTO ui_dive_changelogs (id, session_id, component_id, change_type, description, before_screenshot_id, after_screenshot_id, files_changed, git_commit, metadata)
+         VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)`).run(id, sessionId, componentId ?? null, changeType, description, beforeScreenshotId ?? null, afterScreenshotId ?? null, filesChanged ? JSON.stringify(filesChanged) : null, gitCommit ?? null, metadata ? JSON.stringify(metadata) : null);
+            return {
+                changelogId: id,
+                changeType,
+                description,
+                beforeScreenshotId: beforeScreenshotId ?? null,
+                afterScreenshotId: afterScreenshotId ?? null,
+                filesChanged: filesChanged ?? [],
+                gitCommit: gitCommit ?? null,
+                _hint: "Changelog entry recorded. It will appear in the dive report and walkthrough.",
+            };
+        },
+    },
+    // ── 7. Generate a complete walkthrough ────────────────────────────────
+    {
+        name: "dive_walkthrough",
+        description: "Generate a comprehensive page-by-page, component-by-component walkthrough document for a dive session. Includes: route map with source files, component tree, interaction test results with pass/fail per step, screenshots referenced at each point, design issues found, backend dependencies, console errors, and changelog entries. This is the final deliverable — a complete QA document that an agent or human can review.",
+        inputSchema: {
+            type: "object",
+            properties: {
+                sessionId: { type: "string", description: "Dive session ID" },
+                format: {
+                    type: "string",
+                    description: "Output format: markdown (readable), json (structured), summary (condensed)",
+                    enum: ["markdown", "json", "summary"],
+                },
+                includeScreenshotPaths: {
+                    type: "boolean",
+                    description: "Include file paths to screenshots (default: true)",
+                },
+            },
+            required: ["sessionId"],
+        },
+        handler: async (args) => {
+            const { sessionId, format, includeScreenshotPaths } = args;
+            const db = getDb();
+            const session = db.prepare("SELECT * FROM ui_dive_sessions WHERE id = ?").get(sessionId);
+            if (!session)
+                return { error: true, message: `Session not found: ${sessionId}` };
+            const components = db.prepare("SELECT * FROM ui_dive_components WHERE session_id = ? ORDER BY created_at").all(sessionId);
+            const bugs = db.prepare("SELECT * FROM ui_dive_bugs WHERE session_id = ? ORDER BY severity, created_at").all(sessionId);
+            const screenshots = db.prepare("SELECT * FROM ui_dive_screenshots WHERE session_id = ? ORDER BY created_at").all(sessionId);
+            const tests = db.prepare("SELECT * FROM ui_dive_interaction_tests WHERE session_id = ? ORDER BY created_at").all(sessionId);
+            const designIssues = db.prepare("SELECT * FROM ui_dive_design_issues WHERE session_id = ? ORDER BY severity, created_at").all(sessionId);
+            const backendLinks = db.prepare("SELECT * FROM ui_dive_backend_links WHERE session_id = ? ORDER BY component_id").all(sessionId);
+            const changelogs = db.prepare("SELECT * FROM ui_dive_changelogs WHERE session_id = ? ORDER BY created_at").all(sessionId);
+            // Load test steps for each test
+            const testSteps = {};
+            for (const test of tests) {
+                testSteps[test.id] = db.prepare("SELECT * FROM ui_dive_test_steps WHERE test_id = ? ORDER BY step_index").all(test.id);
+            }
+            // Group components by route (from metadata)
+            const routeGroups = new Map();
+            for (const comp of components) {
+                const meta = comp.metadata ? JSON.parse(comp.metadata) : {};
+                const route = meta.route ?? "(unrouted)";
+                if (!routeGroups.has(route))
+                    routeGroups.set(route, []);
+                routeGroups.get(route).push({ ...comp, _meta: meta });
+            }
+            if (format === "json") {
+                return {
+                    session: {
+                        id: session.id,
+                        appUrl: session.app_url,
+                        appName: session.app_name,
+                        status: session.status,
+                        createdAt: session.created_at,
+                    },
+                    stats: {
+                        routes: routeGroups.size,
+                        components: components.length,
+                        bugs: bugs.length,
+                        screenshots: screenshots.length,
+                        tests: tests.length,
+                        testsPassed: tests.filter((t) => t.status === "passed").length,
+                        testsFailed: tests.filter((t) => t.status === "failed").length,
+                        designIssues: designIssues.length,
+                        backendLinks: backendLinks.length,
+                        changelogs: changelogs.length,
+                    },
+                    routes: Object.fromEntries([...routeGroups.entries()].map(([route, comps]) => [
+                        route,
+                        {
+                            components: comps.map(c => ({
+                                id: c.id,
+                                name: c.name,
+                                type: c.component_type,
+                                status: c.status,
+                                sourceFiles: c._meta.sourceFiles ?? [],
+                                bugs: bugs.filter(b => b.component_id === c.id).map(b => ({ id: b.id, severity: b.severity, title: b.title })),
+                                backendLinks: backendLinks.filter(l => l.component_id === c.id).map(l => ({ type: l.link_type, path: l.path })),
+                                tests: tests.filter(t => t.component_id === c.id).map(t => ({
+                                    id: t.id,
+                                    name: t.test_name,
+                                    status: t.status,
+                                    passed: t.steps_passed,
+                                    failed: t.steps_failed,
+                                    total: t.steps_total,
+                                    steps: (testSteps[t.id] ?? []).map(s => ({
+                                        index: s.step_index,
+                                        action: s.action,
+                                        expected: s.expected,
+                                        actual: s.actual,
+                                        status: s.status,
+                                        screenshotId: s.screenshot_id,
+                                    })),
+                                })),
+                            })),
+                            designIssues: designIssues.filter(d => comps.some(c => c.id === d.component_id)).map(d => ({
+                                id: d.id,
+                                type: d.issue_type,
+                                severity: d.severity,
+                                title: d.title,
+                                expected: d.expected_value,
+                                actual: d.actual_value,
+                            })),
+                        },
+                    ])),
+                    changelogs: changelogs.map(c => ({
+                        id: c.id,
+                        type: c.change_type,
+                        description: c.description,
+                        filesChanged: c.files_changed ? JSON.parse(c.files_changed) : [],
+                        gitCommit: c.git_commit,
+                    })),
+                    screenshots: includeScreenshotPaths !== false
+                        ? screenshots.map(s => ({ id: s.id, label: s.label, filePath: s.file_path, route: s.route }))
+                        : undefined,
+                };
+            }
+            // Markdown format
+            const lines = [];
+            lines.push(`# UI/UX Dive Walkthrough: ${session.app_name ?? session.app_url}`);
+            lines.push(`**Session:** ${session.id}  `);
+            lines.push(`**URL:** ${session.app_url}  `);
+            lines.push(`**Date:** ${session.created_at}  `);
+            lines.push(`**Status:** ${session.status}\n`);
+            // Stats
+            lines.push("## Summary\n");
+            lines.push(`| Metric | Value |`);
+            lines.push(`|--------|-------|`);
+            lines.push(`| Routes | ${routeGroups.size} |`);
+            lines.push(`| Components | ${components.length} |`);
+            lines.push(`| Interaction Tests | ${tests.length} (${tests.filter((t) => t.status === "passed").length} passed, ${tests.filter((t) => t.status === "failed").length} failed) |`);
+            lines.push(`| Bugs | ${bugs.length} |`);
+            lines.push(`| Design Issues | ${designIssues.length} |`);
+            lines.push(`| Screenshots | ${screenshots.length} |`);
+            lines.push(`| Backend Links | ${backendLinks.length} |`);
+            lines.push(`| Changelogs | ${changelogs.length} |`);
+            lines.push("");
+            // Route-by-route walkthrough
+            lines.push("## Route-by-Route Walkthrough\n");
+            for (const [route, comps] of routeGroups) {
+                const sourceFiles = comps[0]?._meta?.sourceFiles ?? [];
+                lines.push(`### ${route}\n`);
+                if (sourceFiles.length > 0)
+                    lines.push(`**Source files:** ${sourceFiles.join(", ")}  `);
+                lines.push(`**Components:** ${comps.length}\n`);
+                for (const comp of comps) {
+                    lines.push(`#### ${comp.name} (${comp.component_type})`);
+                    lines.push(`- **Status:** ${comp.status}`);
+                    lines.push(`- **Interactions:** ${comp.interaction_count}`);
+                    // Backend links
+                    const compLinks = backendLinks.filter(l => l.component_id === comp.id);
+                    if (compLinks.length > 0) {
+                        lines.push(`- **Backend dependencies:**`);
+                        for (const link of compLinks) {
+                            lines.push(`  - \`[${link.link_type}]\` ${link.path}${link.description ? ` -- ${link.description}` : ""}`);
+                        }
+                    }
+                    // Tests for this component
+                    const compTests = tests.filter(t => t.component_id === comp.id);
+                    if (compTests.length > 0) {
+                        lines.push(`\n**Interaction Tests:**\n`);
+                        for (const test of compTests) {
+                            const icon = test.status === "passed" ? "PASS" : test.status === "failed" ? "FAIL" : "PENDING";
+                            lines.push(`##### [${icon}] ${test.test_name}`);
+                            if (test.description)
+                                lines.push(`${test.description}`);
+                            if (test.preconditions) {
+                                const preconds = JSON.parse(test.preconditions);
+                                lines.push(`\n**Preconditions:**`);
+                                for (const p of preconds)
+                                    lines.push(`- ${p}`);
+                            }
+                            lines.push(`\n| Step | Action | Expected | Actual | Status | Screenshot |`);
+                            lines.push(`|------|--------|----------|--------|--------|------------|`);
+                            for (const step of (testSteps[test.id] ?? [])) {
+                                const stepIcon = step.status === "passed" ? "PASS" : step.status === "failed" ? "FAIL" : step.status;
+                                const ssRef = step.screenshot_id ?? "-";
+                                lines.push(`| ${step.step_index} | ${step.action} ${step.target ?? ""} | ${step.expected ?? ""} | ${step.actual ?? "-"} | ${stepIcon} | ${ssRef} |`);
+                            }
+                            lines.push("");
+                        }
+                    }
+                    // Bugs
+                    const compBugs = bugs.filter(b => b.component_id === comp.id);
+                    if (compBugs.length > 0) {
+                        lines.push(`\n**Bugs:**\n`);
+                        for (const bug of compBugs) {
+                            lines.push(`- **[${bug.severity.toUpperCase()}]** ${bug.title}`);
+                            if (bug.description)
+                                lines.push(`  ${bug.description}`);
+                            if (bug.screenshot_ref)
+                                lines.push(`  Screenshot: ${bug.screenshot_ref}`);
+                        }
+                    }
+                    lines.push("");
+                }
+                // Design issues for this route
+                const routeDesignIssues = designIssues.filter(d => d.route === route);
+                if (routeDesignIssues.length > 0) {
+                    lines.push(`**Design Issues on ${route}:**\n`);
+                    for (const issue of routeDesignIssues) {
+                        lines.push(`- **[${issue.severity.toUpperCase()}] ${issue.issue_type}:** ${issue.title}`);
+                        if (issue.expected_value || issue.actual_value) {
+                            lines.push(`  Expected: ${issue.expected_value ?? "?"} | Actual: ${issue.actual_value ?? "?"}`);
+                        }
+                    }
+                    lines.push("");
+                }
+            }
+            // Changelog
+            if (changelogs.length > 0) {
+                lines.push("## Changelog\n");
+                for (const chg of changelogs) {
+                    lines.push(`### [${chg.change_type}] ${chg.description}`);
+                    if (chg.files_changed) {
+                        const files = JSON.parse(chg.files_changed);
+                        lines.push(`**Files changed:** ${files.join(", ")}`);
+                    }
+                    if (chg.git_commit)
+                        lines.push(`**Commit:** ${chg.git_commit}`);
+                    if (chg.before_screenshot_id || chg.after_screenshot_id) {
+                        lines.push(`**Before:** ${chg.before_screenshot_id ?? "-"} | **After:** ${chg.after_screenshot_id ?? "-"}`);
+                    }
+                    lines.push("");
+                }
+            }
+            const markdown = lines.join("\n");
+            return {
+                format: "markdown",
+                walkthrough: format === "summary" ? markdown.slice(0, 3000) : markdown,
+                stats: {
+                    routes: routeGroups.size,
+                    components: components.length,
+                    tests: tests.length,
+                    bugs: bugs.length,
+                    designIssues: designIssues.length,
+                    screenshots: screenshots.length,
+                    backendLinks: backendLinks.length,
+                    changelogs: changelogs.length,
+                },
+            };
+        },
+    },
+];
+//# sourceMappingURL=uiUxDiveAdvancedTools.js.map