npm - retestkit - Versions diffs - 1.4.1 → 1.5.0 - Mend

retestkit 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (238)

package/README.md +59 -40
package/dist/config.js +8 -8
package/dist/config.js.map +1 -1
package/dist/logger.js +1 -1
package/dist/logger.js.map +1 -1
package/dist/prompts/index.d.ts +1 -1
package/dist/prompts/index.d.ts.map +1 -1
package/dist/prompts/index.js +21 -21
package/dist/prompts/index.js.map +1 -1
package/dist/prompts/templates/mcp/retest-crawl.md +7 -0
package/{src/prompts/templates/mcp/webtest-discover-flows.md → dist/prompts/templates/mcp/retest-discover-flows.md} +1 -1
package/{src/prompts/templates/mcp/webtest-discover.md → dist/prompts/templates/mcp/retest-discover.md} +2 -2
package/dist/prompts/templates/mcp/retest-full-workflow.md +12 -0
package/{src/prompts/templates/mcp/webtest-generate-tests.md → dist/prompts/templates/mcp/retest-generate-tests.md} +1 -1
package/{src/prompts/templates/mcp/webtest-run-test.md → dist/prompts/templates/mcp/retest-run-test.md} +1 -1
package/{src/prompts/templates/mcp/webtest-start.md → dist/prompts/templates/mcp/retest-start.md} +1 -1
package/{src → dist}/prompts/templates/sampling/system-prefix.md +1 -1
package/dist/resources/index.js +7 -7
package/dist/resources/index.js.map +1 -1
package/dist/schemas/config.js +2 -2
package/dist/schemas/config.js.map +1 -1
package/dist/security/index.js +1 -1
package/dist/security/index.js.map +1 -1
package/dist/server.js +3 -3
package/dist/server.js.map +1 -1
package/dist/test-utils/mock-context.js +22 -22
package/dist/test-utils/mock-context.js.map +1 -1
package/dist/tools/index.d.ts +1 -1
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +5 -5
package/dist/tools/index.js.map +1 -1
package/dist/tools/retest/crawl.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/crawl.js +7 -7
package/dist/tools/retest/crawl.js.map +1 -0
package/dist/tools/retest/discover-features.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-features.js +6 -6
package/dist/tools/retest/discover-features.js.map +1 -0
package/dist/tools/retest/discover-flows.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-flows.js +6 -6
package/dist/tools/retest/discover-flows.js.map +1 -0
package/dist/tools/retest/generate-tests.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/generate-tests.js +5 -5
package/dist/tools/retest/generate-tests.js.map +1 -0
package/dist/tools/retest/index.d.ts.map +1 -0
package/dist/tools/retest/index.js.map +1 -0
package/dist/tools/retest/run-test-case.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/run-test-case.js +3 -3
package/dist/tools/retest/run-test-case.js.map +1 -0
package/dist/tools/retest/schemas.d.ts.map +1 -0
package/dist/tools/retest/schemas.js.map +1 -0
package/dist/tools/retest/start-analysis.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/start-analysis.js +5 -5
package/dist/tools/retest/start-analysis.js.map +1 -0
package/dist/workspace/index.js +8 -8
package/dist/workspace/index.js.map +1 -1
package/dist/workspace/types.d.ts +2 -2
package/dist/workspace/types.d.ts.map +1 -1
package/package.json +6 -2
package/.claude/commands/openspec/apply.md +0 -23
package/.claude/commands/openspec/archive.md +0 -27
package/.claude/commands/openspec/proposal.md +0 -28
package/.gemini/commands/openspec/apply.toml +0 -21
package/.gemini/commands/openspec/archive.toml +0 -25
package/.gemini/commands/openspec/proposal.toml +0 -26
package/.github/prompts/openspec-apply.prompt.md +0 -22
package/.github/prompts/openspec-archive.prompt.md +0 -26
package/.github/prompts/openspec-proposal.prompt.md +0 -27
package/.github/workflows/release.yml +0 -33
package/.kilocode/workflows/openspec-apply.md +0 -17
package/.kilocode/workflows/openspec-archive.md +0 -21
package/.kilocode/workflows/openspec-proposal.md +0 -22
package/.mcp.json +0 -23
package/.opencode/command/openspec-apply.md +0 -25
package/.opencode/command/openspec-archive.md +0 -28
package/.opencode/command/openspec-proposal.md +0 -30
package/.roo/commands/openspec-apply.md +0 -20
package/.roo/commands/openspec-archive.md +0 -24
package/.roo/commands/openspec-proposal.md +0 -25
package/.vscode/mcp.json +0 -23
package/AGENTS.md +0 -18
package/CLAUDE.md +0 -18
package/dist/tools/webtest/crawl.d.ts.map +0 -1
package/dist/tools/webtest/crawl.js.map +0 -1
package/dist/tools/webtest/discover-features.d.ts.map +0 -1
package/dist/tools/webtest/discover-features.js.map +0 -1
package/dist/tools/webtest/discover-flows.d.ts.map +0 -1
package/dist/tools/webtest/discover-flows.js.map +0 -1
package/dist/tools/webtest/generate-tests.d.ts.map +0 -1
package/dist/tools/webtest/generate-tests.js.map +0 -1
package/dist/tools/webtest/index.d.ts.map +0 -1
package/dist/tools/webtest/index.js.map +0 -1
package/dist/tools/webtest/run-test-case.d.ts.map +0 -1
package/dist/tools/webtest/run-test-case.js.map +0 -1
package/dist/tools/webtest/schemas.d.ts.map +0 -1
package/dist/tools/webtest/schemas.js.map +0 -1
package/dist/tools/webtest/start-analysis.d.ts.map +0 -1
package/dist/tools/webtest/start-analysis.js.map +0 -1
package/openspec/AGENTS.md +0 -456
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/proposal.md +0 -33
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-resources/spec.md +0 -27
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-tools/spec.md +0 -304
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/tasks.md +0 -43
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/design.md +0 -209
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/proposal.md +0 -41
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/specs/mcp-server-core/spec.md +0 -183
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/tasks.md +0 -112
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/design.md +0 -333
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/proposal.md +0 -66
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/mcp-server-core/spec.md +0 -129
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-lifecycle/spec.md +0 -138
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-logging/spec.md +0 -211
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-prompts/spec.md +0 -157
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-resources/spec.md +0 -213
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-sampling/spec.md +0 -257
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-tools/spec.md +0 -501
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/tasks.md +0 -264
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/proposal.md +0 -24
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/specs/webtest-tools/spec.md +0 -80
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/tasks.md +0 -8
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/design.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/proposal.md +0 -28
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/specs/webtest-sampling/spec.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/tasks.md +0 -33
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/design.md +0 -558
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/proposal.md +0 -119
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-resources/spec.md +0 -109
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-tools/spec.md +0 -121
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/tasks.md +0 -133
package/openspec/changes/extract-prompts-to-markdown/design.md +0 -86
package/openspec/changes/extract-prompts-to-markdown/proposal.md +0 -50
package/openspec/changes/extract-prompts-to-markdown/specs/webtest-prompts/spec.md +0 -74
package/openspec/changes/extract-prompts-to-markdown/tasks.md +0 -40
package/openspec/changes/refactor-webtest-naming/design.md +0 -95
package/openspec/changes/refactor-webtest-naming/proposal.md +0 -66
package/openspec/changes/refactor-webtest-naming/specs/webtest-prompts/spec.md +0 -79
package/openspec/changes/refactor-webtest-naming/specs/webtest-resources/spec.md +0 -80
package/openspec/changes/refactor-webtest-naming/specs/webtest-sampling/spec.md +0 -122
package/openspec/changes/refactor-webtest-naming/specs/webtest-tools/spec.md +0 -113
package/openspec/changes/refactor-webtest-naming/tasks.md +0 -119
package/openspec/changes/rename-package-to-retest/proposal.md +0 -52
package/openspec/changes/rename-package-to-retest/specs/mcp-server-core/spec.md +0 -53
package/openspec/changes/rename-package-to-retest/specs/retest-lifecycle/spec.md +0 -68
package/openspec/changes/rename-package-to-retest/specs/retest-logging/spec.md +0 -35
package/openspec/changes/rename-package-to-retest/specs/retest-prompts/spec.md +0 -159
package/openspec/changes/rename-package-to-retest/specs/retest-resources/spec.md +0 -251
package/openspec/changes/rename-package-to-retest/specs/retest-sampling/spec.md +0 -99
package/openspec/changes/rename-package-to-retest/specs/retest-tools/spec.md +0 -295
package/openspec/changes/rename-package-to-retest/tasks.md +0 -71
package/openspec/project.md +0 -31
package/openspec/specs/mcp-server-core/spec.md +0 -178
package/openspec/specs/webtest-lifecycle/spec.md +0 -136
package/openspec/specs/webtest-logging/spec.md +0 -209
package/openspec/specs/webtest-prompts/spec.md +0 -155
package/openspec/specs/webtest-resources/spec.md +0 -248
package/openspec/specs/webtest-sampling/spec.md +0 -344
package/openspec/specs/webtest-tools/spec.md +0 -282
package/release.config.js +0 -9
package/src/config.test.ts +0 -96
package/src/config.ts +0 -32
package/src/elicitation/index.test.ts +0 -399
package/src/elicitation/index.ts +0 -171
package/src/elicitation/types.ts +0 -68
package/src/index.ts +0 -83
package/src/lifecycle/index.test.ts +0 -260
package/src/lifecycle/index.ts +0 -101
package/src/logger.redaction.test.ts +0 -322
package/src/logger.test.ts +0 -123
package/src/logger.ts +0 -229
package/src/playwright-client/index.ts +0 -392
package/src/playwright-client/types.ts +0 -99
package/src/progress/index.test.ts +0 -327
package/src/progress/index.ts +0 -170
package/src/progress/types.ts +0 -25
package/src/prompts/index.test.ts +0 -451
package/src/prompts/index.ts +0 -246
package/src/prompts/loader.test.ts +0 -100
package/src/prompts/loader.ts +0 -59
package/src/prompts/templates/mcp/webtest-crawl.md +0 -7
package/src/prompts/templates/mcp/webtest-full-workflow.md +0 -12
package/src/resources/index.ts +0 -250
package/src/resources/subscriptions.ts +0 -37
package/src/sampling/index.test.ts +0 -414
package/src/sampling/index.ts +0 -286
package/src/sampling/prompts.ts +0 -194
package/src/sampling/types.ts +0 -60
package/src/schemas/config.ts +0 -39
package/src/security/index.test.ts +0 -441
package/src/security/index.ts +0 -361
package/src/security/security-scenarios.test.ts +0 -468
package/src/server.ts +0 -211
package/src/test-utils/index.ts +0 -6
package/src/test-utils/mock-context.ts +0 -426
package/src/test-utils/mock-playwright-client.ts +0 -422
package/src/tools/index.ts +0 -11
package/src/tools/webtest/crawl.test.ts +0 -834
package/src/tools/webtest/crawl.ts +0 -901
package/src/tools/webtest/discover-features.ts +0 -412
package/src/tools/webtest/discover-flows.ts +0 -408
package/src/tools/webtest/generate-tests.test.ts +0 -532
package/src/tools/webtest/generate-tests.ts +0 -425
package/src/tools/webtest/index.ts +0 -7
package/src/tools/webtest/integration.test.ts +0 -536
package/src/tools/webtest/run-test-case.test.ts +0 -659
package/src/tools/webtest/run-test-case.ts +0 -508
package/src/tools/webtest/schemas.ts +0 -201
package/src/tools/webtest/start-analysis.test.ts +0 -151
package/src/tools/webtest/start-analysis.ts +0 -158
package/src/transports/http.ts +0 -19
package/src/transports/index.ts +0 -30
package/src/transports/stdio.ts +0 -7
package/src/types/capabilities.test.ts +0 -193
package/src/types/capabilities.ts +0 -50
package/src/types/context.ts +0 -21
package/src/types/tool.ts +0 -11
package/src/workspace/index.ts +0 -945
package/src/workspace/markdown.ts +0 -272
package/src/workspace/types.ts +0 -186
package/tests/integration/server.test.ts +0 -89
package/tests/integration/tools.test.ts +0 -99
package/tsconfig.json +0 -20
package/vitest.config.ts +0 -9
package/vitest.integration.config.ts +0 -10
/package/{src → dist}/prompts/templates/sampling/crawl-action.md +0 -0
/package/{src → dist}/prompts/templates/sampling/feature-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/flow-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/page-content-wrapper.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-evaluation.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-generation.md +0 -0
/package/dist/tools/{webtest → retest}/crawl.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-features.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-flows.d.ts +0 -0
/package/dist/tools/{webtest → retest}/generate-tests.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.js +0 -0
/package/dist/tools/{webtest → retest}/run-test-case.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.js +0 -0
/package/dist/tools/{webtest → retest}/start-analysis.d.ts +0 -0

package/src/tools/webtest/run-test-case.test.ts DELETED

@@ -1,659 +0,0 @@
-/**
- * Unit Tests for webtest_run_tests tool (Phase 7.8)
- */
-import { describe, it, expect, vi, beforeEach } from "vitest";
-import { createRunTestCaseTool } from "./run-test-case.js";
-import {
-  createMockContext,
-  type MockContext,
-} from "../../test-utils/index.js";
-describe("webtest_run_tests", () => {
-  let context: MockContext;
-  let tool: ReturnType<typeof createRunTestCaseTool>;
-  beforeEach(() => {
-    context = createMockContext();
-    tool = createRunTestCaseTool(() => context as any);
-    // Set up workspace with tests
-    context.workspaceManager.readWorkspaceIndex = vi.fn().mockResolvedValue({
-      url: "https://shop.example.com",
-      domain: "shop.example.com",
-      focus: "Test checkout flow",
-      crawls: [],
-      analysis: {
-        appAnalysisUri: "webtest://test/analysis/app-analysis.md",
-        flowsUri: "webtest://test/analysis/flows.md",
-      },
-      tests: {
-        testsUri: "webtest://test/tests/tests.md",
-        testCount: 2,
-      },
-      runs: [],
-      limits: { maxSteps: 100, maxMinutes: 30, maxPages: 50 },
-    });
-    // Set up resource reading for tests (markdown with YAML frontmatter)
-    context.resourceManager.readResource = vi.fn().mockResolvedValue({
-      text: `---
-tests:
-  - id: test-browse-001
-    name: Browse products successfully
-    category: happy_path
-    purpose: Verify user can browse product list
-    preconditions:
-      - User is on home page
-    steps:
-      - stepNumber: 1
-        action: Click
-        target: a.products-link
-        expected: Products page loads
-      - stepNumber: 2
-        action: Verify
-        expected: Product list is visible
-    expectedOutcomes:
-      - Products page is displayed
-    tags:
-      - browse
-  - id: test-checkout-001
-    name: Complete checkout
-    category: happy_path
-    purpose: Verify user can complete checkout
-    preconditions: []
-    steps:
-      - stepNumber: 1
-        action: Navigate to
-        target: /cart
-        expected: Cart page loads
-    expectedOutcomes:
-      - Order is placed
-    tags:
-      - checkout
----
-# Test Cases
-## Browse products successfully
-...
-`,
-    });
-    // Set up evaluation result
-    context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-      success: true,
-      data: {
-        passed: true,
-        reasoning: "Expected outcome matched",
-        confidence: 0.95,
-      },
-    });
-    // Connect playwright
-    context.playwrightClient.isConnected = vi.fn().mockReturnValue(true);
-  });
-  describe("tool metadata", () => {
-    it("has correct name", () => {
-      expect(tool.name).toBe("webtest_run_test");
-    });
-    it("has a description", () => {
-      expect(tool.description).toBeDefined();
-      expect(tool.description.length).toBeGreaterThan(0);
-    });
-    it("has an input schema", () => {
-      expect(tool.inputSchema).toBeDefined();
-    });
-  });
-  describe("handler - validation", () => {
-    it("returns error for non-existent workspace", async () => {
-      context.workspaceManager.workspaceExists = vi.fn().mockResolvedValue(false);
-      const result = await tool.handler({
-        analysisId: "00000000-0000-0000-0000-000000000000",
-        testCaseId: "test-1",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("not found");
-    });
-    it("returns error when no tests exist", async () => {
-      context.workspaceManager.readWorkspaceIndex = vi.fn().mockResolvedValue({
-        url: "https://example.com",
-        domain: "example.com",
-        crawls: [],
-        analysis: null,
-        tests: null,
-        runs: [],
-        limits: { maxSteps: 100, maxMinutes: 30, maxPages: 50 },
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-1",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("No tests found");
-    });
-    it("returns error for non-existent test case", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "non-existent-test",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("not found");
-      expect(result.content[0].text).toContain("Available tests");
-    });
-    it("returns error when tests fail to load", async () => {
-      context.resourceManager.readResource = vi.fn().mockRejectedValue(
-        new Error("File not found")
-      );
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(result.isError).toBe(true);
-      expect(result.content[0].text).toContain("Error loading");
-    });
-  });
-  describe("handler - test execution", () => {
-    it("creates test run in workspace", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.workspaceManager.createTestRun).toHaveBeenCalledWith(
-        context.testAnalysisId,
-        expect.objectContaining({
-          testCaseId: "test-browse-001",
-          testName: "Browse products successfully",
-        })
-      );
-    });
-    it("connects to playwright if not connected", async () => {
-      context.playwrightClient.isConnected = vi.fn().mockReturnValue(false);
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.playwrightClient.connect).toHaveBeenCalled();
-    });
-    it("navigates to workspace URL first", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.playwrightClient.navigate).toHaveBeenCalledWith(
-        "https://shop.example.com"
-      );
-    });
-    it("executes click actions", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      // When no element/ref provided, falls back to target as element with empty ref
-      expect(context.playwrightClient.click).toHaveBeenCalledWith("a.products-link", "");
-    });
-    it("returns runId in response", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.runId).toBeDefined();
-    });
-    it("returns test status", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBeDefined();
-      expect(["passed", "failed", "error"]).toContain(content.status);
-    });
-    it("returns step results", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.stepResults).toBeInstanceOf(Array);
-      expect(content.stepResults.length).toBeGreaterThan(0);
-    });
-    it("returns summary with step counts", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.summary).toBeDefined();
-      expect(content.summary.totalSteps).toBeGreaterThan(0);
-      expect(content.summary.passed).toBeDefined();
-    });
-  });
-  describe("handler - evidence capture", () => {
-    it("captures screenshot at each step by default", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.playwrightClient.screenshot).toHaveBeenCalled();
-    });
-    it("captures snapshot at each step by default", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.playwrightClient.snapshot).toHaveBeenCalled();
-    });
-    it("saves evidence to workspace", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.workspaceManager.saveTestStepEvidence).toHaveBeenCalled();
-    });
-    it("skips evidence when captureEvidence is false", async () => {
-      vi.clearAllMocks();
-      // Need to re-mock after clear
-      context.playwrightClient.navigate = vi.fn().mockResolvedValue(undefined);
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-        runOptions: {
-          captureEvidence: false,
-          stopOnFailure: true,
-          retryFailedSteps: false,
-        },
-      });
-      expect(context.workspaceManager.saveTestStepEvidence).not.toHaveBeenCalled();
-    });
-  });
-  describe("handler - assertion evaluation", () => {
-    it("evaluates step assertions via sampling", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.samplingClient.createMessage).toHaveBeenCalled();
-    });
-    it("marks step as failed when assertion fails", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          passed: false,
-          reasoning: "Expected product list but saw error page",
-          confidence: 0.9,
-        },
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("failed");
-    });
-    it("continues without sampling when unavailable", async () => {
-      context.samplingClient.hasSampling = vi.fn().mockReturnValue(false);
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      // Should still pass (no assertion evaluation)
-      expect(result.isError).toBeFalsy();
-    });
-  });
-  describe("handler - stop on failure", () => {
-    it("stops on first failure by default", async () => {
-      context.playwrightClient.click = vi.fn()
-        .mockRejectedValueOnce(new Error("Element not found"))
-        .mockResolvedValue(undefined);
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("error");
-      expect(content.summary.skipped).toBeGreaterThan(0);
-    });
-    it("continues on failure when stopOnFailure is false", async () => {
-      context.playwrightClient.click = vi.fn()
-        .mockRejectedValueOnce(new Error("Element not found"))
-        .mockResolvedValue(undefined);
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-        runOptions: {
-          captureEvidence: true,
-          stopOnFailure: false,
-          retryFailedSteps: false,
-        },
-      });
-      const content = JSON.parse(result.content[0].text!);
-      // All steps should have been attempted
-      expect(content.summary.skipped).toBe(0);
-    });
-  });
-  describe("handler - retry failed steps", () => {
-    it("retries failed steps when enabled", async () => {
-      let callCount = 0;
-      context.playwrightClient.click = vi.fn().mockImplementation(() => {
-        callCount++;
-        if (callCount === 1) {
-          return Promise.reject(new Error("Transient error"));
-        }
-        return Promise.resolve();
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-        runOptions: {
-          captureEvidence: true,
-          stopOnFailure: true,
-          retryFailedSteps: true,
-        },
-      });
-      // Should have retried and passed
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("passed");
-    });
-  });
-  describe("handler - cancellation", () => {
-    it("handles cancellation gracefully", async () => {
-      const { CancellationError } = await import("../../progress/index.js");
-      context.cancellationRegistry.checkCancelled = vi.fn().mockImplementation((id) => {
-        throw new CancellationError(id);
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(result.isError).toBeFalsy();
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("cancelled");
-    });
-    it("registers for cancellation on start", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.cancellationRegistry.register).toHaveBeenCalled();
-    });
-    it("unregisters cancellation on completion", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.cancellationRegistry.unregister).toHaveBeenCalled();
-    });
-  });
-  describe("handler - progress reporting", () => {
-    it("emits progress for each step", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.progressEmitter.emit).toHaveBeenCalled();
-    });
-    it("includes step info in progress", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.progressEmitter.emit).toHaveBeenCalledWith(
-        expect.objectContaining({
-          progress: expect.any(Number),
-          total: expect.any(Number),
-          message: expect.stringContaining("Step"),
-        })
-      );
-    });
-  });
-  describe("handler - resource notifications", () => {
-    it("notifies on test run creation", async () => {
-      vi.clearAllMocks();
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.resourceManager.notifyListChanged).toHaveBeenCalled();
-    });
-  });
-  describe("handler - action execution", () => {
-    it("executes navigate actions", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-checkout-001",
-      });
-      expect(context.playwrightClient.navigate).toHaveBeenCalledWith("/cart");
-    });
-    it("handles type actions", async () => {
-      context.resourceManager.readResource = vi.fn().mockResolvedValue({
-        text: `---
-tests:
-  - id: test-type-001
-    name: Type in field
-    category: happy_path
-    purpose: Test typing
-    preconditions: []
-    steps:
-      - stepNumber: 1
-        action: Type
-        target: input.search
-        value: test query
-    expectedOutcomes:
-      - Text is entered
----
-# Test Cases
-...
-`,
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-type-001",
-      });
-      // When no element/ref provided, falls back to target as element with empty ref
-      expect(context.playwrightClient.type).toHaveBeenCalledWith("input.search", "", "test query");
-    });
-    it("handles fill actions", async () => {
-      context.resourceManager.readResource = vi.fn().mockResolvedValue({
-        text: `---
-tests:
-  - id: test-fill-001
-    name: Fill field
-    category: happy_path
-    purpose: Test filling
-    preconditions: []
-    steps:
-      - stepNumber: 1
-        action: Fill
-        target: input.email
-        value: test@example.com
-    expectedOutcomes:
-      - Field is filled
----
-# Test Cases
-...
-`,
-      });
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-fill-001",
-      });
-      // When no element/ref provided, falls back to target as element with empty ref
-      expect(context.playwrightClient.fill).toHaveBeenCalledWith("input.email", "", "test@example.com");
-    });
-  });
-  describe("handler - error handling", () => {
-    it("handles playwright connection errors", async () => {
-      context.playwrightClient.isConnected = vi.fn().mockReturnValue(false);
-      context.playwrightClient.connect = vi.fn().mockRejectedValue(
-        new Error("Connection failed")
-      );
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(result.isError).toBe(true);
-    });
-    it("handles step execution errors", async () => {
-      context.playwrightClient.click = vi.fn().mockRejectedValue(
-        new Error("Element not found")
-      );
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.status).toBe("error");
-      expect(content.stepResults[0].errorMessage).toBeDefined();
-    });
-  });
-  describe("handler - next steps", () => {
-    it("returns success next steps when test passes", async () => {
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.nextSteps).toBeInstanceOf(Array);
-      expect(content.nextSteps.some((s: string) => s.includes("passed"))).toBe(true);
-    });
-    it("returns investigation steps when test fails", async () => {
-      context.samplingClient.createMessage = vi.fn().mockResolvedValue({
-        success: true,
-        data: {
-          passed: false,
-          reasoning: "Element not visible",
-          confidence: 0.9,
-        },
-      });
-      const result = await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      const content = JSON.parse(result.content[0].text!);
-      expect(content.nextSteps.some((s: string) => s.includes("Investigate"))).toBe(true);
-    });
-  });
-  describe("handler - logging", () => {
-    it("logs test execution start", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.logger.info).toHaveBeenCalledWith(
-        expect.stringContaining("test case"),
-        expect.any(Object)
-      );
-    });
-    it("logs completion with results", async () => {
-      await tool.handler({
-        analysisId: context.testAnalysisId,
-        testCaseId: "test-browse-001",
-      });
-      expect(context.logger.info).toHaveBeenCalledWith(
-        expect.stringContaining("completed"),
-        expect.objectContaining({
-          status: expect.any(String),
-        })
-      );
-    });
-  });
-});