npm - retestkit - Versions diffs - 1.4.1 → 1.5.0 - Mend

retestkit 1.4.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (238)

package/README.md +59 -40
package/dist/config.js +8 -8
package/dist/config.js.map +1 -1
package/dist/logger.js +1 -1
package/dist/logger.js.map +1 -1
package/dist/prompts/index.d.ts +1 -1
package/dist/prompts/index.d.ts.map +1 -1
package/dist/prompts/index.js +21 -21
package/dist/prompts/index.js.map +1 -1
package/dist/prompts/templates/mcp/retest-crawl.md +7 -0
package/{src/prompts/templates/mcp/webtest-discover-flows.md → dist/prompts/templates/mcp/retest-discover-flows.md} +1 -1
package/{src/prompts/templates/mcp/webtest-discover.md → dist/prompts/templates/mcp/retest-discover.md} +2 -2
package/dist/prompts/templates/mcp/retest-full-workflow.md +12 -0
package/{src/prompts/templates/mcp/webtest-generate-tests.md → dist/prompts/templates/mcp/retest-generate-tests.md} +1 -1
package/{src/prompts/templates/mcp/webtest-run-test.md → dist/prompts/templates/mcp/retest-run-test.md} +1 -1
package/{src/prompts/templates/mcp/webtest-start.md → dist/prompts/templates/mcp/retest-start.md} +1 -1
package/{src → dist}/prompts/templates/sampling/system-prefix.md +1 -1
package/dist/resources/index.js +7 -7
package/dist/resources/index.js.map +1 -1
package/dist/schemas/config.js +2 -2
package/dist/schemas/config.js.map +1 -1
package/dist/security/index.js +1 -1
package/dist/security/index.js.map +1 -1
package/dist/server.js +3 -3
package/dist/server.js.map +1 -1
package/dist/test-utils/mock-context.js +22 -22
package/dist/test-utils/mock-context.js.map +1 -1
package/dist/tools/index.d.ts +1 -1
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +5 -5
package/dist/tools/index.js.map +1 -1
package/dist/tools/retest/crawl.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/crawl.js +7 -7
package/dist/tools/retest/crawl.js.map +1 -0
package/dist/tools/retest/discover-features.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-features.js +6 -6
package/dist/tools/retest/discover-features.js.map +1 -0
package/dist/tools/retest/discover-flows.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/discover-flows.js +6 -6
package/dist/tools/retest/discover-flows.js.map +1 -0
package/dist/tools/retest/generate-tests.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/generate-tests.js +5 -5
package/dist/tools/retest/generate-tests.js.map +1 -0
package/dist/tools/retest/index.d.ts.map +1 -0
package/dist/tools/retest/index.js.map +1 -0
package/dist/tools/retest/run-test-case.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/run-test-case.js +3 -3
package/dist/tools/retest/run-test-case.js.map +1 -0
package/dist/tools/retest/schemas.d.ts.map +1 -0
package/dist/tools/retest/schemas.js.map +1 -0
package/dist/tools/retest/start-analysis.d.ts.map +1 -0
package/dist/tools/{webtest → retest}/start-analysis.js +5 -5
package/dist/tools/retest/start-analysis.js.map +1 -0
package/dist/workspace/index.js +8 -8
package/dist/workspace/index.js.map +1 -1
package/dist/workspace/types.d.ts +2 -2
package/dist/workspace/types.d.ts.map +1 -1
package/package.json +6 -2
package/.claude/commands/openspec/apply.md +0 -23
package/.claude/commands/openspec/archive.md +0 -27
package/.claude/commands/openspec/proposal.md +0 -28
package/.gemini/commands/openspec/apply.toml +0 -21
package/.gemini/commands/openspec/archive.toml +0 -25
package/.gemini/commands/openspec/proposal.toml +0 -26
package/.github/prompts/openspec-apply.prompt.md +0 -22
package/.github/prompts/openspec-archive.prompt.md +0 -26
package/.github/prompts/openspec-proposal.prompt.md +0 -27
package/.github/workflows/release.yml +0 -33
package/.kilocode/workflows/openspec-apply.md +0 -17
package/.kilocode/workflows/openspec-archive.md +0 -21
package/.kilocode/workflows/openspec-proposal.md +0 -22
package/.mcp.json +0 -23
package/.opencode/command/openspec-apply.md +0 -25
package/.opencode/command/openspec-archive.md +0 -28
package/.opencode/command/openspec-proposal.md +0 -30
package/.roo/commands/openspec-apply.md +0 -20
package/.roo/commands/openspec-archive.md +0 -24
package/.roo/commands/openspec-proposal.md +0 -25
package/.vscode/mcp.json +0 -23
package/AGENTS.md +0 -18
package/CLAUDE.md +0 -18
package/dist/tools/webtest/crawl.d.ts.map +0 -1
package/dist/tools/webtest/crawl.js.map +0 -1
package/dist/tools/webtest/discover-features.d.ts.map +0 -1
package/dist/tools/webtest/discover-features.js.map +0 -1
package/dist/tools/webtest/discover-flows.d.ts.map +0 -1
package/dist/tools/webtest/discover-flows.js.map +0 -1
package/dist/tools/webtest/generate-tests.d.ts.map +0 -1
package/dist/tools/webtest/generate-tests.js.map +0 -1
package/dist/tools/webtest/index.d.ts.map +0 -1
package/dist/tools/webtest/index.js.map +0 -1
package/dist/tools/webtest/run-test-case.d.ts.map +0 -1
package/dist/tools/webtest/run-test-case.js.map +0 -1
package/dist/tools/webtest/schemas.d.ts.map +0 -1
package/dist/tools/webtest/schemas.js.map +0 -1
package/dist/tools/webtest/start-analysis.d.ts.map +0 -1
package/dist/tools/webtest/start-analysis.js.map +0 -1
package/openspec/AGENTS.md +0 -456
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/proposal.md +0 -33
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-resources/spec.md +0 -27
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/specs/webtest-tools/spec.md +0 -304
package/openspec/changes/archive/2025-12-18-add-hybrid-artifact-paths/tasks.md +0 -43
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/design.md +0 -209
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/proposal.md +0 -41
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/specs/mcp-server-core/spec.md +0 -183
package/openspec/changes/archive/2025-12-18-add-mcp-server-foundation/tasks.md +0 -112
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/design.md +0 -333
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/proposal.md +0 -66
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/mcp-server-core/spec.md +0 -129
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-lifecycle/spec.md +0 -138
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-logging/spec.md +0 -211
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-prompts/spec.md +0 -157
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-resources/spec.md +0 -213
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-sampling/spec.md +0 -257
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/specs/webtest-tools/spec.md +0 -501
package/openspec/changes/archive/2025-12-18-add-webtest-orchestrator/tasks.md +0 -264
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/proposal.md +0 -24
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/specs/webtest-tools/spec.md +0 -80
package/openspec/changes/archive/2025-12-18-allow-analysis-of-incomplete-crawls/tasks.md +0 -8
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/design.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/proposal.md +0 -28
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/specs/webtest-sampling/spec.md +0 -90
package/openspec/changes/archive/2025-12-18-fix-crawl-loop-stability/tasks.md +0 -33
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/design.md +0 -558
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/proposal.md +0 -119
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-resources/spec.md +0 -109
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/specs/webtest-tools/spec.md +0 -121
package/openspec/changes/archive/2025-12-18-use-markdown-artifacts/tasks.md +0 -133
package/openspec/changes/extract-prompts-to-markdown/design.md +0 -86
package/openspec/changes/extract-prompts-to-markdown/proposal.md +0 -50
package/openspec/changes/extract-prompts-to-markdown/specs/webtest-prompts/spec.md +0 -74
package/openspec/changes/extract-prompts-to-markdown/tasks.md +0 -40
package/openspec/changes/refactor-webtest-naming/design.md +0 -95
package/openspec/changes/refactor-webtest-naming/proposal.md +0 -66
package/openspec/changes/refactor-webtest-naming/specs/webtest-prompts/spec.md +0 -79
package/openspec/changes/refactor-webtest-naming/specs/webtest-resources/spec.md +0 -80
package/openspec/changes/refactor-webtest-naming/specs/webtest-sampling/spec.md +0 -122
package/openspec/changes/refactor-webtest-naming/specs/webtest-tools/spec.md +0 -113
package/openspec/changes/refactor-webtest-naming/tasks.md +0 -119
package/openspec/changes/rename-package-to-retest/proposal.md +0 -52
package/openspec/changes/rename-package-to-retest/specs/mcp-server-core/spec.md +0 -53
package/openspec/changes/rename-package-to-retest/specs/retest-lifecycle/spec.md +0 -68
package/openspec/changes/rename-package-to-retest/specs/retest-logging/spec.md +0 -35
package/openspec/changes/rename-package-to-retest/specs/retest-prompts/spec.md +0 -159
package/openspec/changes/rename-package-to-retest/specs/retest-resources/spec.md +0 -251
package/openspec/changes/rename-package-to-retest/specs/retest-sampling/spec.md +0 -99
package/openspec/changes/rename-package-to-retest/specs/retest-tools/spec.md +0 -295
package/openspec/changes/rename-package-to-retest/tasks.md +0 -71
package/openspec/project.md +0 -31
package/openspec/specs/mcp-server-core/spec.md +0 -178
package/openspec/specs/webtest-lifecycle/spec.md +0 -136
package/openspec/specs/webtest-logging/spec.md +0 -209
package/openspec/specs/webtest-prompts/spec.md +0 -155
package/openspec/specs/webtest-resources/spec.md +0 -248
package/openspec/specs/webtest-sampling/spec.md +0 -344
package/openspec/specs/webtest-tools/spec.md +0 -282
package/release.config.js +0 -9
package/src/config.test.ts +0 -96
package/src/config.ts +0 -32
package/src/elicitation/index.test.ts +0 -399
package/src/elicitation/index.ts +0 -171
package/src/elicitation/types.ts +0 -68
package/src/index.ts +0 -83
package/src/lifecycle/index.test.ts +0 -260
package/src/lifecycle/index.ts +0 -101
package/src/logger.redaction.test.ts +0 -322
package/src/logger.test.ts +0 -123
package/src/logger.ts +0 -229
package/src/playwright-client/index.ts +0 -392
package/src/playwright-client/types.ts +0 -99
package/src/progress/index.test.ts +0 -327
package/src/progress/index.ts +0 -170
package/src/progress/types.ts +0 -25
package/src/prompts/index.test.ts +0 -451
package/src/prompts/index.ts +0 -246
package/src/prompts/loader.test.ts +0 -100
package/src/prompts/loader.ts +0 -59
package/src/prompts/templates/mcp/webtest-crawl.md +0 -7
package/src/prompts/templates/mcp/webtest-full-workflow.md +0 -12
package/src/resources/index.ts +0 -250
package/src/resources/subscriptions.ts +0 -37
package/src/sampling/index.test.ts +0 -414
package/src/sampling/index.ts +0 -286
package/src/sampling/prompts.ts +0 -194
package/src/sampling/types.ts +0 -60
package/src/schemas/config.ts +0 -39
package/src/security/index.test.ts +0 -441
package/src/security/index.ts +0 -361
package/src/security/security-scenarios.test.ts +0 -468
package/src/server.ts +0 -211
package/src/test-utils/index.ts +0 -6
package/src/test-utils/mock-context.ts +0 -426
package/src/test-utils/mock-playwright-client.ts +0 -422
package/src/tools/index.ts +0 -11
package/src/tools/webtest/crawl.test.ts +0 -834
package/src/tools/webtest/crawl.ts +0 -901
package/src/tools/webtest/discover-features.ts +0 -412
package/src/tools/webtest/discover-flows.ts +0 -408
package/src/tools/webtest/generate-tests.test.ts +0 -532
package/src/tools/webtest/generate-tests.ts +0 -425
package/src/tools/webtest/index.ts +0 -7
package/src/tools/webtest/integration.test.ts +0 -536
package/src/tools/webtest/run-test-case.test.ts +0 -659
package/src/tools/webtest/run-test-case.ts +0 -508
package/src/tools/webtest/schemas.ts +0 -201
package/src/tools/webtest/start-analysis.test.ts +0 -151
package/src/tools/webtest/start-analysis.ts +0 -158
package/src/transports/http.ts +0 -19
package/src/transports/index.ts +0 -30
package/src/transports/stdio.ts +0 -7
package/src/types/capabilities.test.ts +0 -193
package/src/types/capabilities.ts +0 -50
package/src/types/context.ts +0 -21
package/src/types/tool.ts +0 -11
package/src/workspace/index.ts +0 -945
package/src/workspace/markdown.ts +0 -272
package/src/workspace/types.ts +0 -186
package/tests/integration/server.test.ts +0 -89
package/tests/integration/tools.test.ts +0 -99
package/tsconfig.json +0 -20
package/vitest.config.ts +0 -9
package/vitest.integration.config.ts +0 -10
/package/{src → dist}/prompts/templates/sampling/crawl-action.md +0 -0
/package/{src → dist}/prompts/templates/sampling/feature-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/flow-discovery.md +0 -0
/package/{src → dist}/prompts/templates/sampling/page-content-wrapper.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-evaluation.md +0 -0
/package/{src → dist}/prompts/templates/sampling/test-generation.md +0 -0
/package/dist/tools/{webtest → retest}/crawl.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-features.d.ts +0 -0
/package/dist/tools/{webtest → retest}/discover-flows.d.ts +0 -0
/package/dist/tools/{webtest → retest}/generate-tests.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.d.ts +0 -0
/package/dist/tools/{webtest → retest}/index.js +0 -0
/package/dist/tools/{webtest → retest}/run-test-case.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.d.ts +0 -0
/package/dist/tools/{webtest → retest}/schemas.js +0 -0
/package/dist/tools/{webtest → retest}/start-analysis.d.ts +0 -0

package/src/tools/webtest/run-test-case.ts DELETED

@@ -1,508 +0,0 @@
-import { z } from "zod";
-import { join } from "node:path";
-import matter from "gray-matter";
-import type { McpTool, ToolResult } from "../../types/tool.js";
-import type { ServerContext } from "../../types/context.js";
-import type { WorkspaceManager, TestCase, TestStepResult } from "../../workspace/index.js";
-import type { PlaywrightClient } from "../../playwright-client/index.js";
-import type { SamplingClient } from "../../sampling/index.js";
-import type { CancellationRegistry, ProgressEmitter } from "../../progress/index.js";
-import type { ResourceManager } from "../../resources/index.js";
-import { CancellationError } from "../../progress/index.js";
-import { buildTestEvaluationPrompt } from "../../sampling/prompts.js";
-import { TestEvaluationSchema, AnalysisIdSchema } from "./schemas.js";
-export const runTestCaseInputSchema = z.object({
-  analysisId: AnalysisIdSchema,
-  testCaseId: z.string().describe("ID of the test case to run"),
-  testsUri: z
-    .string()
-    .optional()
-    .describe("URI of the tests resource. If not provided, uses the latest tests."),
-  runOptions: z
-    .object({
-      captureEvidence: z.boolean().default(true),
-      stopOnFailure: z.boolean().default(true),
-      retryFailedSteps: z.boolean().default(false),
-    })
-    .optional()
-    .describe("Test run options"),
-});
-export type RunTestCaseInput = z.infer<typeof runTestCaseInputSchema>;
-export function createRunTestCaseTool(
-  getContext: () => ServerContext & {
-    workspaceManager: WorkspaceManager;
-    playwrightClient: PlaywrightClient;
-    samplingClient: SamplingClient;
-    cancellationRegistry: CancellationRegistry;
-    progressEmitter: ProgressEmitter;
-    resourceManager: ResourceManager;
-  }
-): McpTool<RunTestCaseInput> {
-  return {
-    name: "webtest_run_test",
-    description: `Execute a single test case against the web application.
-This tool runs one generated test case:
-- Executes each step using Playwright browser automation
-- Captures evidence (screenshots, snapshots) at each step
-- Evaluates pass/fail using AI-powered assertion checking
-- Reports detailed results with evidence links
-Requires generated test cases. Progress is reported throughout execution.`,
-    inputSchema: runTestCaseInputSchema,
-    async handler(input: RunTestCaseInput): Promise<ToolResult> {
-      const ctx = getContext();
-      const {
-        logger,
-        workspaceManager,
-        playwrightClient,
-        samplingClient,
-        cancellationRegistry,
-        progressEmitter,
-        resourceManager,
-      } = ctx;
-      const requestId = `test-${input.analysisId}-${input.testCaseId}-${Date.now()}`;
-      const runLogger = logger.withCorrelation({
-        analysisId: input.analysisId,
-        requestId,
-      });
-      runLogger.info("Starting test case execution", {
-        testCaseId: input.testCaseId,
-      });
-      // Register for cancellation
-      cancellationRegistry.register(requestId);
-      try {
-        // Validate workspace exists
-        if (!(await workspaceManager.workspaceExists(input.analysisId))) {
-          return {
-            content: [
-              {
-                type: "text",
-                text: `Error: Analysis workspace "${input.analysisId}" not found.`,
-              },
-            ],
-            isError: true,
-          };
-        }
-        const workspace = await workspaceManager.readWorkspaceIndex(input.analysisId);
-        // Check for tests
-        if (!workspace.tests) {
-          return {
-            content: [
-              {
-                type: "text",
-                text: "Error: No tests found. Run webtest_generate_tests first.",
-              },
-            ],
-            isError: true,
-          };
-        }
-        // Load tests
-        const testsUri = input.testsUri || workspace.tests.testsUri;
-        let testsData: { tests: TestCase[] };
-        try {
-          const testsContent = await resourceManager.readResource(testsUri);
-          // Parse tests from markdown frontmatter
-          const { data } = matter(testsContent.text || "");
-          testsData = data as { tests: TestCase[] };
-        } catch (error) {
-          return {
-            content: [
-              {
-                type: "text",
-                text: `Error loading tests: ${error instanceof Error ? error.message : "Unknown error"}`,
-              },
-            ],
-            isError: true,
-          };
-        }
-        // Find test case
-        const testCase = testsData.tests.find((t) => t.id === input.testCaseId);
-        if (!testCase) {
-          return {
-            content: [
-              {
-                type: "text",
-                text: `Error: Test case "${input.testCaseId}" not found. Available tests: ${testsData.tests.map((t) => t.id).join(", ")}`,
-              },
-            ],
-            isError: true,
-          };
-        }
-        const runOptions = input.runOptions ?? {
-          captureEvidence: true,
-          stopOnFailure: true,
-          retryFailedSteps: false,
-        };
-        // Create test run
-        const { runId, runPath } = await workspaceManager.createTestRun(
-          input.analysisId,
-          { testCaseId: input.testCaseId, testName: testCase.name }
-        );
-        const stepLogger = runLogger.withCorrelation({ testRunId: runId });
-        stepLogger.info("Test run created", { runId, testName: testCase.name });
-        await resourceManager.notifyListChanged();
-        // Ensure Playwright is connected
-        if (!playwrightClient.isConnected()) {
-          await playwrightClient.connect();
-        }
-        // Navigate to start URL
-        await playwrightClient.navigate(workspace.url);
-        // Execute test steps
-        const stepResults: TestStepResult[] = [];
-        let overallStatus: "passed" | "failed" | "error" = "passed";
-        let failureStep: number | undefined;
-        for (const step of testCase.steps) {
-          // Check cancellation
-          cancellationRegistry.checkCancelled(requestId);
-          // Emit progress
-          progressEmitter.emit({
-            progressToken: requestId,
-            progress: step.stepNumber,
-            total: testCase.steps.length,
-            message: `Step ${step.stepNumber}/${testCase.steps.length}: ${step.action}`,
-          });
-          stepLogger.info("Executing test step", {
-            stepNumber: step.stepNumber,
-            action: step.action,
-          });
-          const stepResult: TestStepResult = {
-            stepNumber: step.stepNumber,
-            status: "passed",
-            executedAt: new Date().toISOString(),
-            evidence: {},
-          };
-          try {
-            // Execute the step action
-            await executeTestStep(playwrightClient, step);
-            // Wait briefly for page to settle
-            await new Promise((resolve) => setTimeout(resolve, 500));
-            // Capture evidence
-            if (runOptions.captureEvidence) {
-              const screenshot = await playwrightClient.screenshot();
-              const snapshot = await playwrightClient.snapshot();
-              const evidence = await workspaceManager.saveTestStepEvidence(
-                input.analysisId,
-                runId,
-                step.stepNumber,
-                {
-                  screenshot,
-                  snapshot: JSON.stringify(snapshot),
-                }
-              );
-              stepResult.evidence = evidence;
-            }
-            // Evaluate step if expected outcome specified
-            if (step.expected && samplingClient.hasSampling()) {
-              const snapshot = await playwrightClient.snapshot();
-              const evalResult = await samplingClient.createMessage({
-                systemPrompt:
-                  "You are evaluating whether a test step produced the expected outcome.",
-                userPrompt: buildTestEvaluationPrompt({
-                  testStep: `${step.action}${step.target ? ` on "${step.target}"` : ""}${step.value ? ` with value "${step.value}"` : ""}`,
-                  expectedOutcome: step.expected,
-                  actualState: snapshot.content.slice(0, 5000),
-                }),
-                schema: TestEvaluationSchema,
-                maxTokens: 1024,
-              });
-              if (evalResult.success && evalResult.data) {
-                if (!evalResult.data.passed) {
-                  stepResult.status = "failed";
-                  stepResult.actualResult = evalResult.data.reasoning;
-                  if (overallStatus === "passed") {
-                    overallStatus = "failed";
-                    failureStep = step.stepNumber;
-                  }
-                  stepLogger.warn("Step assertion failed", {
-                    stepNumber: step.stepNumber,
-                    reasoning: evalResult.data.reasoning,
-                  });
-                  if (runOptions.stopOnFailure) {
-                    stepResults.push(stepResult);
-                    break;
-                  }
-                }
-              }
-            }
-          } catch (error) {
-            const message =
-              error instanceof Error ? error.message : "Unknown error";
-            stepResult.status = "error";
-            stepResult.errorMessage = message;
-            if (overallStatus === "passed") {
-              overallStatus = "error";
-              failureStep = step.stepNumber;
-            }
-            stepLogger.error("Step execution error", {
-              stepNumber: step.stepNumber,
-              error: message,
-            });
-            // Retry if enabled
-            if (runOptions.retryFailedSteps) {
-              stepLogger.info("Retrying failed step", {
-                stepNumber: step.stepNumber,
-              });
-              try {
-                await executeTestStep(playwrightClient, step);
-                stepResult.status = "passed";
-                stepResult.errorMessage = undefined;
-                if (failureStep === step.stepNumber) {
-                  overallStatus = "passed";
-                  failureStep = undefined;
-                }
-              } catch (retryError) {
-                // Retry also failed
-                stepLogger.error("Step retry also failed", {
-                  stepNumber: step.stepNumber,
-                });
-                if (runOptions.stopOnFailure) {
-                  stepResults.push(stepResult);
-                  break;
-                }
-              }
-            } else if (runOptions.stopOnFailure) {
-              stepResults.push(stepResult);
-              break;
-            }
-          }
-          stepResults.push(stepResult);
-        }
-        // Mark skipped steps
-        const executedSteps = stepResults.map((r) => r.stepNumber);
-        for (const step of testCase.steps) {
-          if (!executedSteps.includes(step.stepNumber)) {
-            stepResults.push({
-              stepNumber: step.stepNumber,
-              status: "skipped",
-              executedAt: new Date().toISOString(),
-              evidence: {},
-            });
-          }
-        }
-        // Sort results by step number
-        stepResults.sort((a, b) => a.stepNumber - b.stepNumber);
-        // Update test run index
-        await workspaceManager.updateTestRunIndex(input.analysisId, runId, {
-          status: overallStatus,
-          completedAt: new Date().toISOString(),
-          steps: stepResults,
-        });
-        // Update workspace run reference
-        const updatedWorkspace = await workspaceManager.readWorkspaceIndex(
-          input.analysisId
-        );
-        const runRef = updatedWorkspace.runs.find((r) => r.runId === runId);
-        if (runRef) {
-          runRef.status = overallStatus;
-          runRef.completedAt = new Date().toISOString();
-          await workspaceManager.updateWorkspaceIndex(input.analysisId, {
-            runs: updatedWorkspace.runs,
-          });
-        }
-        await resourceManager.notifyListChanged();
-        // Generate result summary
-        const passedSteps = stepResults.filter((r) => r.status === "passed").length;
-        const failedSteps = stepResults.filter((r) => r.status === "failed").length;
-        const errorSteps = stepResults.filter((r) => r.status === "error").length;
-        const skippedSteps = stepResults.filter((r) => r.status === "skipped").length;
-        const result = {
-          runId,
-          analysisId: input.analysisId,
-          testCaseId: input.testCaseId,
-          testName: testCase.name,
-          status: overallStatus,
-          summary: {
-            totalSteps: testCase.steps.length,
-            passed: passedSteps,
-            failed: failedSteps,
-            error: errorSteps,
-            skipped: skippedSteps,
-          },
-          failureStep,
-          reportFilePath: join(runPath, "report.md"),
-          reportUri: `webtest://${input.analysisId}/runs/${runId}/report.md`,
-          stepResults: stepResults.map((r) => ({
-            stepNumber: r.stepNumber,
-            status: r.status,
-            evidence: r.evidence,
-            actualResult: r.actualResult,
-            errorMessage: r.errorMessage,
-          })),
-          nextSteps:
-            overallStatus === "passed"
-              ? ["All assertions passed!", "Run more test cases as needed"]
-              : [
-                  `Investigate failure at step ${failureStep}`,
-                  `Review evidence at ${stepResults.find((r) => r.stepNumber === failureStep)?.evidence.screenshotUri || "N/A"}`,
-                ],
-        };
-        stepLogger.info("Test execution completed", {
-          status: overallStatus,
-          passed: passedSteps,
-          failed: failedSteps,
-          error: errorSteps,
-        });
-        return {
-          content: [
-            {
-              type: "text",
-              text: JSON.stringify(result, null, 2),
-            },
-          ],
-        };
-      } catch (error) {
-        if (error instanceof CancellationError) {
-          runLogger.info("Test execution cancelled", {
-            requestId: error.requestId,
-          });
-          return {
-            content: [
-              {
-                type: "text",
-                text: JSON.stringify(
-                  {
-                    status: "cancelled",
-                    message: "Test execution was cancelled by user",
-                  },
-                  null,
-                  2
-                ),
-              },
-            ],
-          };
-        }
-        const message = error instanceof Error ? error.message : "Unknown error";
-        runLogger.error("Test execution failed", { error: message });
-        return {
-          content: [
-            {
-              type: "text",
-              text: `Error during test execution: ${message}`,
-            },
-          ],
-          isError: true,
-        };
-      } finally {
-        cancellationRegistry.unregister(requestId);
-      }
-    },
-  };
-}
-async function executeTestStep(
-  playwright: PlaywrightClient,
-  step: { action: string; target?: string; value?: string; element?: string; ref?: string }
-): Promise<void> {
-  const action = step.action.toLowerCase();
-  // Use element/ref if provided, otherwise fall back to target as the element description
-  // with an empty ref (some implementations may accept this)
-  const element = step.element || step.target || "";
-  const ref = step.ref || "";
-  // Parse the action to determine what to do
-  if (action.includes("navigate") || action.includes("go to")) {
-    const url = step.value || step.target || "";
-    if (url) {
-      await playwright.navigate(url);
-    }
-  } else if (action.includes("click")) {
-    if (element) {
-      await playwright.click(element, ref);
-    }
-  } else if (action.includes("type") || action.includes("enter")) {
-    if (element && step.value) {
-      await playwright.type(element, ref, step.value);
-    }
-  } else if (action.includes("fill")) {
-    if (element && step.value) {
-      await playwright.fill(element, ref, step.value);
-    }
-  } else if (action.includes("hover")) {
-    if (element) {
-      await playwright.hover(element, ref);
-    }
-  } else if (action.includes("select")) {
-    if (element && step.value) {
-      // Convert single value to array as required by the API
-      const values = step.value.includes(",")
-        ? step.value.split(",").map(v => v.trim())
-        : [step.value];
-      await playwright.select(element, ref, values);
-    }
-  } else if (action.includes("press")) {
-    if (step.value) {
-      // press only takes the key, no element targeting
-      await playwright.press(step.value);
-    }
-  } else if (action.includes("scroll")) {
-    const x = parseInt(step.target || "0", 10);
-    const y = parseInt(step.value || "0", 10);
-    await playwright.scroll(x, y);
-  } else if (action.includes("wait")) {
-    const ms = parseInt(step.value || "1000", 10);
-    await playwright.wait(ms);
-  } else {
-    // Default: try to interpret as click if element provided
-    if (element) {
-      await playwright.click(element, ref);
-    }
-  }
-}

package/src/tools/webtest/schemas.ts DELETED

@@ -1,201 +0,0 @@
-import { z } from "zod";
-// Common schemas used across webtest tools
-/**
- * Analysis ID schema - accepts either:
- * - Date-time format: YYYY-MM-DD_HH-mm (new format for workspace folders)
- * - UUID format (legacy support)
- */
-export const AnalysisIdSchema = z
-  .string()
-  .describe("Analysis workspace ID in format YYYY-MM-DD_HH-mm (e.g., 2025-12-18_17-05) or legacy UUID")
-  .refine(
-    (val) => {
-      // Match date-time format: YYYY-MM-DD_HH-mm
-      const dateTimePattern = /^\d{4}-\d{2}-\d{2}_\d{2}-\d{2}$/;
-      // Match UUID format (for legacy support)
-      const uuidPattern = /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
-      return dateTimePattern.test(val) || uuidPattern.test(val);
-    },
-    { message: "Invalid analysis ID. Expected format: YYYY-MM-DD_HH-mm or UUID" }
-  );
-/**
- * Crawl ID schema - accepts either:
- * - Date-time format with seconds: YYYY-MM-DD_HH-mm-ss (new format for crawl folders)
- * - UUID format (legacy support)
- */
-export const CrawlIdSchema = z
-  .string()
-  .describe("Crawl ID in format YYYY-MM-DD_HH-mm-ss (e.g., 2025-12-18_17-06-20) or legacy UUID")
-  .refine(
-    (val) => {
-      // Match date-time format with seconds: YYYY-MM-DD_HH-mm-ss
-      const dateTimePattern = /^\d{4}-\d{2}-\d{2}_\d{2}-\d{2}-\d{2}$/;
-      // Match UUID format (for legacy support)
-      const uuidPattern = /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
-      return dateTimePattern.test(val) || uuidPattern.test(val);
-    },
-    { message: "Invalid crawl ID. Expected format: YYYY-MM-DD_HH-mm-ss or UUID" }
-  );
-export const AnalysisLimitsSchema = z.object({
-  maxSteps: z.number().int().min(1).max(1000).optional(),
-  maxMinutes: z.number().int().min(1).max(180).optional(),
-  maxPages: z.number().int().min(1).max(100).optional(),
-});
-export type AnalysisLimits = z.infer<typeof AnalysisLimitsSchema>;
-export const DomainAllowlistSchema = z.array(z.string()).optional();
-// Sampling response schemas
-/**
- * Args structure per tool (Microsoft Playwright MCP compatible):
- * - navigate: { url: string }
- * - click: { element: string, ref: string }
- * - type: { element: string, ref: string, text: string, submit?: boolean, slowly?: boolean }
- * - fill: { element: string, ref: string, value: string }
- * - hover: { element: string, ref: string }
- * - select: { element: string, ref: string, values: string[] }
- * - press: { key: string }  // No element targeting
- * - scroll: { x: number, y: number }
- * - wait: { ms: number }
- *
- * The `element` field is a human-readable description of the element.
- * The `ref` field is the exact element reference from the accessibility snapshot (e.g., "e1", "e3").
- */
-export const CrawlActionSchema = z.object({
-  actions: z.array(
-    z.object({
-      tool: z.enum([
-        "navigate",
-        "click",
-        "type",
-        "fill",
-        "hover",
-        "select",
-        "press",
-        "scroll",
-        "wait",
-      ]),
-      args: z.record(z.string(), z.any()),
-    })
-  ),
-  reasoning: z.string(),
-  goalProgress: z.string(),
-  goalComplete: z.boolean().optional(),
-  blocked: z.boolean().optional(),
-  blockedReason: z.string().optional(),
-  elicitationNeeded: z
-    .object({
-      type: z.enum([
-        "cookie_consent",
-        "modal_blocking",
-        "ambiguous_navigation",
-        "auth_required",
-      ]),
-      context: z.string(),
-      options: z
-        .array(
-          z.object({
-            url: z.string().optional(),
-            label: z.string(),
-          })
-        )
-        .optional(),
-    })
-    .optional(),
-});
-export type CrawlAction = z.infer<typeof CrawlActionSchema>;
-// Feature-based schemas
-export const FeatureSchema = z.object({
-  slug: z.string().describe("URL-safe identifier for the feature (kebab-case)"),
-  name: z.string().describe("Human-readable feature name"),
-  description: z.string().describe("Brief description of what this feature does"),
-  entities: z.array(z.string()).describe("Key entities/data types in this feature"),
-  entryPoints: z.array(z.string()).describe("URLs or navigation paths to access this feature"),
-});
-export type Feature = z.infer<typeof FeatureSchema>;
-export const FeaturesDiscoverySchema = z.object({
-  appPurpose: z.string().describe("Overall purpose of the application"),
-  appType: z.string().describe("Type of application (e.g., e-commerce, SaaS, content site)"),
-  features: z.array(FeatureSchema).describe("Distinct features/modules of the application"),
-  securityObservations: z.array(z.string()).optional(),
-  accessibilityObservations: z.array(z.string()).optional(),
-});
-export type FeaturesDiscovery = z.infer<typeof FeaturesDiscoverySchema>;
-export const FlowSchema = z.object({
-  id: z.string().describe("Unique flow identifier"),
-  name: z.string().describe("Human-readable flow name"),
-  description: z.string().describe("What this flow accomplishes"),
-  entryPoint: z.string().describe("Starting URL or navigation path"),
-  steps: z.array(z.string()).describe("Ordered list of steps in the flow"),
-});
-export type Flow = z.infer<typeof FlowSchema>;
-export const FlowsDiscoverySchema = z.object({
-  featureSlug: z.string().describe("The feature these flows belong to"),
-  flows: z.array(FlowSchema).describe("User flows within this feature"),
-  suggestedAssertions: z.array(z.string()).describe("Assertions that should hold for these flows"),
-});
-export type FlowsDiscovery = z.infer<typeof FlowsDiscoverySchema>;
-export const FeatureSlugSchema = z
-  .string()
-  .regex(/^[a-z0-9]+(?:-[a-z0-9]+)*$/, "Feature slug must be kebab-case (e.g., 'user-auth', 'shopping-cart')")
-  .describe("Feature identifier in kebab-case");
-export const TestCaseSchema = z.object({
-  id: z.string(),
-  name: z.string(),
-  purpose: z.string(),
-  category: z.enum(["happy_path", "edge_case", "error_handling", "boundary"]),
-  preconditions: z.array(z.string()),
-  steps: z.array(
-    z.object({
-      stepNumber: z.number().int(),
-      action: z.string(),
-      target: z.string().optional(), // Kept for backwards compatibility
-      value: z.string().optional(),
-      expected: z.string().optional(),
-      // Microsoft Playwright MCP compatible fields
-      element: z.string().optional(), // Human-readable element description
-      ref: z.string().optional(), // Element reference from accessibility snapshot (e.g., "e1", "e3")
-    })
-  ),
-  expectedOutcomes: z.array(z.string()),
-  tags: z.array(z.string()).optional(),
-});
-export type TestCase = z.infer<typeof TestCaseSchema>;
-export const TestGenerationSchema = z.object({
-  tests: z.array(TestCaseSchema),
-  coverage: z.object({
-    flowsCovered: z.array(z.string()),
-    estimatedCoverage: z.string(),
-  }),
-});
-export type TestGeneration = z.infer<typeof TestGenerationSchema>;
-export const TestEvaluationSchema = z.object({
-  passed: z.boolean(),
-  reasoning: z.string(),
-  evidence: z.array(z.string()),
-  discrepancies: z.array(z.string()).optional(),
-});
-export type TestEvaluation = z.infer<typeof TestEvaluationSchema>;