npm - testdriverai - Versions diffs - 7.8.0-test.7 → 7.8.0-test.71 - Mend

testdriverai 7.8.0-test.7 → 7.8.0-test.71

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (98) hide show

package/agent/index.js +18 -5
package/agent/lib/commands.js +3 -2
package/agent/lib/http.js +162 -0
package/agent/lib/logger.js +15 -0
package/agent/lib/sandbox.js +554 -209
package/agent/lib/sdk.js +5 -22
package/agent/lib/system.js +25 -65
package/ai/skills/testdriver-cache/SKILL.md +221 -0
package/ai/skills/testdriver-errors/SKILL.md +246 -0
package/ai/skills/testdriver-events/SKILL.md +356 -0
package/ai/skills/testdriver-find/SKILL.md +14 -20
package/ai/skills/testdriver-mcp/SKILL.md +7 -0
package/ai/skills/testdriver-provision/SKILL.md +331 -0
package/ai/skills/testdriver-redraw/SKILL.md +214 -0
package/ai/skills/testdriver-running-tests/SKILL.md +1 -1
package/ai/skills/testdriver-screenshots/SKILL.md +184 -0
package/docs/_data/examples-manifest.json +46 -46
package/docs/_scripts/extract-example-urls.js +67 -72
package/docs/changelog.mdx +148 -8
package/docs/docs.json +46 -38
package/docs/images/content/vscode/v7-chat.png +0 -0
package/docs/images/content/vscode/v7-choose-agent.png +0 -0
package/docs/images/content/vscode/v7-full.png +0 -0
package/docs/images/content/vscode/v7-onboarding.png +0 -0
package/docs/v7/cache.mdx +223 -0
package/docs/v7/copilot/auto-healing.mdx +265 -0
package/docs/v7/copilot/creating-tests.mdx +156 -0
package/docs/v7/copilot/github.mdx +143 -0
package/docs/v7/copilot/running-tests.mdx +149 -0
package/docs/v7/copilot/setup.mdx +143 -0
package/docs/v7/enterprise.mdx +3 -110
package/docs/v7/errors.mdx +248 -0
package/docs/v7/events.mdx +358 -0
package/docs/v7/examples/ai.mdx +1 -1
package/docs/v7/examples/assert.mdx +1 -1
package/docs/v7/examples/captcha-api.mdx +1 -1
package/docs/v7/examples/chrome-extension.mdx +1 -1
package/docs/v7/examples/drag-and-drop.mdx +1 -1
package/docs/v7/examples/element-not-found.mdx +1 -1
package/docs/v7/examples/exec-output.mdx +85 -0
package/docs/v7/examples/exec-pwsh.mdx +83 -0
package/docs/v7/examples/focus-window.mdx +62 -0
package/docs/v7/examples/hover-image.mdx +1 -1
package/docs/v7/examples/hover-text.mdx +1 -1
package/docs/v7/examples/installer.mdx +1 -1
package/docs/v7/examples/launch-vscode-linux.mdx +1 -1
package/docs/v7/examples/match-image.mdx +1 -1
package/docs/v7/examples/press-keys.mdx +1 -1
package/docs/v7/examples/scroll-keyboard.mdx +1 -1
package/docs/v7/examples/scroll-until-image.mdx +1 -1
package/docs/v7/examples/scroll-until-text.mdx +1 -1
package/docs/v7/examples/scroll.mdx +1 -1
package/docs/v7/examples/type.mdx +1 -1
package/docs/v7/examples/windows-installer.mdx +1 -1
package/docs/v7/find.mdx +14 -20
package/docs/v7/{cloud.mdx → hosted.mdx} +43 -5
package/docs/v7/mcp.mdx +9 -0
package/docs/v7/provision.mdx +333 -0
package/docs/v7/quickstart.mdx +30 -2
package/docs/v7/redraw.mdx +216 -0
package/docs/v7/running-tests.mdx +1 -1
package/docs/v7/screenshots.mdx +186 -0
package/docs/v7/self-hosted.mdx +127 -44
package/docs/v7/test-results-json.mdx +258 -0
package/examples/scroll-keyboard.test.mjs +1 -1
package/examples/scroll.test.mjs +1 -12
package/interfaces/logger.js +0 -12
package/interfaces/vitest-plugin.mjs +170 -51
package/lib/core/Dashcam.js +30 -23
package/lib/environments.json +22 -0
package/lib/github-comment.mjs +58 -40
package/lib/init-project.js +5 -67
package/lib/resolve-channel.js +42 -12
package/lib/sentry.js +47 -23
package/lib/vitest/hooks.mjs +63 -3
package/{examples → manual}/drag-and-drop.test.mjs +1 -1
package/manual/exec-stream-logs.test.mjs +25 -0
package/mcp-server/dist/server.mjs +28 -8
package/mcp-server/src/server.ts +31 -8
package/package.json +4 -3
package/sdk.d.ts +4 -0
package/sdk.js +45 -15
package/setup/aws/install-dev-runner.sh +79 -0
package/setup/aws/spawn-runner.sh +165 -0
package/test-sentry-span.js +35 -0
package/vitest.config.mjs +22 -34
package/vitest.runner.config.mjs +33 -0
/package/{examples → manual}/flake-diffthreshold-001.test.mjs +0 -0
/package/{examples → manual}/flake-diffthreshold-01.test.mjs +0 -0
/package/{examples → manual}/flake-diffthreshold-05.test.mjs +0 -0
/package/{examples → manual}/flake-noredraw-cache.test.mjs +0 -0
/package/{examples → manual}/flake-noredraw-nocache.test.mjs +0 -0
/package/{examples → manual}/flake-redraw-cache.test.mjs +0 -0
/package/{examples → manual}/flake-redraw-nocache.test.mjs +0 -0
/package/{examples → manual}/flake-rocket-match.test.mjs +0 -0
/package/{examples → manual}/flake-shared.mjs +0 -0
/package/{examples → manual}/no-provision.test.mjs +0 -0
/package/{examples → manual}/scroll-until-text.test.mjs +0 -0

package/docs/v7/test-results-json.mdx ADDED Viewed

@@ -0,0 +1,258 @@
+---
+title: "Test Result JSON"
+sidebarTitle: "Test Result JSON"
+description: "Per-test JSON result files with metadata, versions, and infrastructure details"
+icon: "file-code"
+---
+## Overview
+TestDriver automatically writes a JSON result file for each test case after it finishes. These files contain comprehensive metadata about the test run, including SDK and runner versions, infrastructure details, interaction statistics, and links to recordings.
+Result files are written to:
+```
+.testdriver/results/<testFile>/<testName>.json
+```
+For example, a test file `tests/login.test.mjs` with a test named `"should log in"` produces:
+```
+.testdriver/results/tests/login.test.mjs/should_log_in.json
+```
+<Note>
+  Test names are sanitized for filesystem use — special characters are replaced with underscores and names are truncated to 200 characters.
+</Note>
+## Enabling
+No configuration is required. The JSON files are written automatically by the TestDriver Vitest reporter plugin whenever tests run.
+## JSON Schema
+Each result file is organized into logical groups:
+### `versions`
+| Field | Type | Description |
+|---|---|---|
+| `versions.sdk` | `string \| null` | TestDriver SDK version (e.g. `"7.8.0"`) |
+| `versions.vitest` | `string \| null` | Vitest version used to run the test |
+| `versions.api` | `string \| null` | TestDriver API server version |
+| `versions.runnerBefore` | `string \| null` | Runner version at sandbox start |
+| `versions.runnerAfter` | `string \| null` | Runner version after auto-update |
+| `versions.runnerWasUpdated` | `boolean` | Whether the runner was auto-updated during provisioning |
+### `test`
+| Field | Type | Description |
+|---|---|---|
+| `test.file` | `string \| null` | Relative path to the test file |
+| `test.name` | `string \| null` | Name of the test case |
+| `test.suite` | `string \| null` | Name of the parent `describe` block |
+| `test.passed` | `boolean` | Whether the test passed |
+| `test.caseId` | `string \| null` | Database ID for this test case |
+| `test.runId` | `string \| null` | Database ID for the overall test run |
+| `test.error` | `string \| null` | Error message if the test failed |
+| `test.errorStack` | `string \| null` | Error stack trace if the test failed |
+### `urls`
+| Field | Type | Description |
+|---|---|---|
+| `urls.api` | `string \| null` | API root URL used for this test |
+| `urls.console` | `string \| null` | TestDriver console base URL |
+| `urls.vnc` | `string \| null` | VNC URL for the sandbox |
+| `urls.testRun` | `string \| null` | Direct link to this test case in the console |
+### `replay`
+The `replay` object contains the recording replay URL and derived embed links. The `gifUrl` and `embedUrl` are generated automatically from the replay URL.
+| Field | Type | Description |
+|---|---|---|
+| `replay.url` | `string \| null` | Recording replay URL |
+| `replay.gifUrl` | `string \| null` | Animated GIF thumbnail of the recording |
+| `replay.embedUrl` | `string \| null` | Embeddable replay URL (appends `&embed=true`) |
+| `replay.markdown` | `string \| null` | Ready-to-use Markdown embed with GIF linking to the replay |
+The `replay.markdown` field produces a clickable GIF badge you can paste directly into PR comments, README files, or issue descriptions:
+```markdown
+[![Test Recording](https://api.testdriver.ai/replay/abc123/gif?shareKey=xyz)](https://console.testdriver.ai/replay/abc123?share=xyz)
+```
+### `date`
+| Field | Type | Description |
+|---|---|---|
+| `date` | `string` | ISO 8601 timestamp when the test finished |
+### `team`
+| Field | Type | Description |
+|---|---|---|
+| `team.id` | `string \| null` | Team ID from the sandbox |
+| `team.sessionId` | `string \| null` | SDK session ID |
+### `infrastructure`
+| Field | Type | Description |
+|---|---|---|
+| `infrastructure.sandboxId` | `string \| null` | Sandbox instance ID |
+| `infrastructure.instanceId` | `string \| null` | Instance ID |
+| `infrastructure.os` | `string \| null` | Operating system of the sandbox (`"linux"` or `"windows"`) |
+| `infrastructure.amiId` | `string \| null` | AWS AMI ID used for provisioning |
+| `infrastructure.e2bTemplateId` | `string \| null` | E2B template ID used for provisioning |
+| `infrastructure.imageVersion` | `string \| null` | Sandbox image version |
+### `realtime`
+| Field | Type | Description |
+|---|---|---|
+| `realtime.channel` | `string \| null` | Ably channel name used for communication |
+| `realtime.messageCount` | `number` | Number of messages published to the realtime channel |
+### `interactions`
+| Field | Type | Description |
+|---|---|---|
+| `interactions.total` | `number` | Total number of interactions recorded |
+| `interactions.cached` | `number` | Number of interactions served from cache |
+| `interactions.byType` | `object` | Breakdown of interactions by type (e.g. `find`, `click`, `assert`) |
+## Example Output
+```json
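+{
+  "versions": {
+    "sdk": "7.8.0",
+    "vitest": "4.0.0",
+    "api": "1.45.0",
+    "runnerBefore": "2.1.0",
+    "runnerAfter": "2.1.1",
+    "runnerWasUpdated": true
+  },
+  "test": {
+    "file": "tests/login.test.mjs",
+    "name": "should log in",
+    "suite": "Login",
+    "passed": true,
+    "caseId": "def456",
+    "runId": "abc123",
+    "error": null,
+    "errorStack": null
+  },
+  "urls": {
+    "api": "https://api.testdriver.ai",
+    "console": "https://console.testdriver.ai",
+    "vnc": "wss://sandbox-123.testdriver.ai/vnc",
+    "testRun": "https://console.testdriver.ai/runs/abc123/def456"
+  },
+  "replay": {
+    "url": "https://console.testdriver.ai/replay/abc123?share=xyz",
+    "gifUrl": "https://api.testdriver.ai/replay/abc123/gif?shareKey=xyz",
+    "embedUrl": "https://console.testdriver.ai/replay/abc123?share=xyz&embed=true",
+    "markdown": "[![Test Recording](https://api.testdriver.ai/replay/abc123/gif?shareKey=xyz)](https://console.testdriver.ai/replay/abc123?share=xyz)"
+  },
+  "date": "2025-01-15T14:30:00.000Z",
+  "team": {
+    "id": "team_abc123",
+    "sessionId": "sess_xyz789"
+  },
+  "infrastructure": {
+    "sandboxId": "sandbox-123",
+    "instanceId": "i-abc123",
+    "os": "linux",
+    "amiId": "ami-0abc123",
+    "e2bTemplateId": null,
+    "imageVersion": "v2.1.0"
+  },
+  "realtime": {
+    "channel": "sandbox:sandbox-123",
+    "messageCount": 42
+  },
+  "interactions": {
+    "total": 15,
+    "cached": 3,
+    "byType": {
+      "find": 8,
+      "click": 5,
+      "assert": 2
+    }
+  }
+}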
+```
+## Using Result Files in CI
+Result files are useful for extracting test metadata in CI pipelines without parsing log output.
+### GitHub Actions Example
+Use `fromJSON` to parse a result file into a GitHub Actions expression you can reference in subsequent steps:
+```yaml
+- name: Run tests
+  run: npx vitest run tests/login.test.mjs
+- name: Parse result
+  id: result
+  run: |
+    # Read the first JSON result file
+    FILE=$(find .testdriver/results -name '*.json' | head -n 1)
+    echo "json=$(jq -c . "$FILE")" >> "$GITHUB_OUTPUT"
+- name: Comment on PR
+  if: fromJSON(steps.result.outputs.json).test.passed == false
+  uses: actions/github-script@v7
+  with:
+    script: |
+      const result = ${{ steps.result.outputs.json }};
+      await github.rest.issues.createComment({
+        owner: context.repo.owner,
+        repo: context.repo.repo,
+        issue_number: context.issue.number,
+        body: [
+          `❌ **${result.test.name}** failed`,
+          ``,
+          `Error: ${result.test.error}`,
+          ``,
+          result.replay.markdown,
+          ``,
+          `[View full recording](${result.urls.testRun})`
+        ].join('\n')
+      });
+```
+You can also load all results into a matrix or iterate over them:
+```yaml
+- name: Run tests
+  run: npx vitest run tests/*.test.mjs
+- name: Collect results
+  id: results
+  run: |
+    # Merge all result files into a JSON array
+    echo "json=$(find .testdriver/results -name '*.json' -exec cat {} + | jq -cs '.')" >> "$GITHUB_OUTPUT"
+- name: Summary
+  run: |
+    echo '## Test Results' >> $GITHUB_STEP_SUMMARY
+    RESULTS='${{ steps.results.outputs.json }}'
+    echo "$RESULTS" | jq -r '.[] | "| \(.test.name) | \(if .test.passed then "✅" else "❌" end) | \(.urls.testRun) |"' >> $GITHUB_STEP_SUMMARY
+```
+### Reading Results Programmatically
+```javascript
+import fs from "fs";
+import path from "path";
+const resultsDir = ".testdriver/results";
+function readResults(dir) {
+  const results = [];
+  for (const testDir of fs.readdirSync(dir, { recursive: true })) {
+    const fullPath = path.join(dir, testDir);
+    if (fullPath.endsWith(".json") && fs.statSync(fullPath).isFile()) {
+      results.push(JSON.parse(fs.readFileSync(fullPath, "utf-8")));
+    }
+  }
+  return results;
+}
+const results = readResults(resultsDir);
+const passed = results.filter(r => r.test.passed);
+const failed = results.filter(r => !r.test.passed);
+console.log(`${passed.length} passed, ${failed.length} failed`);
+for (const r of failed) {
+  console.log(`  FAIL: ${r.test.name} — ${r.test.error}`);
+  console.log(`  Recording: ${r.urls.testRun}`);
+  console.log(`  Embed: ${r.replay.markdown}`);
+}
+```

package/examples/scroll-keyboard.test.mjs CHANGED Viewed

@@ -16,7 +16,7 @@ describe("Scroll Keyboard Test", () => {
     // Navigate to https://www.webhamster.com/
     await testdriver.focusApplication("Google Chrome");
     const urlBar = await testdriver.find(
-      "testdriver-sandbox.vercel.app/login, the URL in the omnibox showing the current page", {zoom: true}
+      "the URL in the omnibox", {zoom: true}
     );
     await urlBar.click();
     await testdriver.pressKeys(["ctrl", "a"]);

package/examples/scroll.test.mjs CHANGED Viewed

@@ -12,19 +12,8 @@ import { getDefaults } from "./config.mjs";
 describe("Scroll Test", () => {
   it("should navigate and scroll down the page", async (context) => {
     const testdriver = TestDriver(context, { ...getDefaults(context), headless: true });
-    await testdriver.provision.chrome({ url: 'http://testdriver-sandbox.vercel.app/login' });
+    await testdriver.provision.chrome({ url: 'https://www.webhamster.com/' });
-    // Give Chrome a moment to fully render the UI
-    await new Promise(resolve => setTimeout(resolve, 2000));
-    // Navigate to webhamster.com - just look for the domain, not the full path
-    const urlBar = await testdriver.find(
-      "testdriver-sandbox.vercel.app, the URL in the address bar",
-    );
-    await urlBar.click();
-    await testdriver.pressKeys(["ctrl", "a"]);
-    await testdriver.type("https://www.webhamster.com/");
-    await testdriver.pressKeys(["enter"]);
     // Wait for page to load and click heading
     const heading = await testdriver.find(

package/interfaces/logger.js CHANGED Viewed

@@ -24,18 +24,6 @@ class CustomTransport extends Transport {
         return;
       }
-      if (!this.sandbox) {
-        this.sandbox = require("../agent/lib/sandbox");
-      }
-      if (this.sandbox && this.sandbox.instanceSocketConnected) {
-        this.sandbox.send({
-          type: "output",
-          output: Buffer.from(message).toString("base64"),
-        }).catch((e) => {
-          console.error("Error sending log:", e);
-        });
-      }
     } catch (e) {
       console.error("Error in CustomTransport log method:", e);
     }