npm - testdriverai - Versions diffs - 7.2.2 → 7.2.9 - Mend

testdriverai 7.2.2 → 7.2.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

package/.github/workflows/publish.yaml +15 -7
package/.github/workflows/testdriver.yml +36 -0
package/agent/index.js +28 -109
package/bin/testdriverai.js +8 -0
package/debugger/index.html +37 -0
package/docs/docs.json +2 -11
package/docs/v7/_drafts/architecture.mdx +1 -26
package/docs/v7/_drafts/provision.mdx +251 -188
package/docs/v7/_drafts/quick-start-test-recording.mdx +0 -1
package/docs/v7/_drafts/test-recording.mdx +0 -6
package/docs/v7/api/act.mdx +1 -0
package/docs/v7/getting-started/quickstart.mdx +9 -16
package/interfaces/cli/commands/init.js +33 -19
package/interfaces/cli/lib/base.js +24 -0
package/interfaces/cli.js +8 -1
package/interfaces/logger.js +8 -3
package/interfaces/vitest-plugin.mjs +16 -71
package/lib/sentry.js +343 -0
package/lib/vitest/hooks.mjs +23 -31
package/package.json +4 -3
package/sdk-log-formatter.js +41 -0
package/sdk.js +335 -94
package/test/testdriver/act.test.mjs +30 -0
package/test/testdriver/assert.test.mjs +1 -1
package/test/testdriver/hover-text.test.mjs +1 -1
package/test/testdriver/installer.test.mjs +47 -0
package/test/testdriver/launch-vscode-linux.test.mjs +55 -0
package/test/testdriver/setup/testHelpers.mjs +8 -118
package/tests/example.test.js +33 -0
package/tests/login.js +28 -0
package/vitest.config.js +18 -0
package/vitest.config.mjs +1 -0
package/agent/lib/cache.js +0 -142

package/.github/workflows/publish.yaml CHANGED Viewed

@@ -1,12 +1,13 @@
-name: Publish Beta
+name: Publish
 permissions:
     contents: write
+    id-token: write  # Required for OIDC
 on:
   push:
     branches: [ main ]
 jobs:
-  publish-beta:
+  publish:
     runs-on: ubuntu-latest
     steps:
@@ -29,16 +30,23 @@ jobs:
     - name: Install dependencies
       run: npm ci
-    - name: Bump version (prerelease beta)
-      run: npm version prerelease --preid=beta --no-git-tag-version
+    - name: Bump version (patch)
+      run: npm version patch --no-git-tag-version
     - name: Commit and push version bump
       run: |
         git add package.json package-lock.json
-        git commit -m "chore: bump beta version to $(node -p "require('./package.json').version")"
+        git commit -m "chore: bump version to $(node -p "require('./package.json').version")"
         git push
-    - name: Publish to npm under beta tag
-      run: npm publish --tag beta
+    - name: Debug NPM Token
+      run: |
+        echo "NPM_TOKEN is set: ${{ secrets.NPM_TOKEN != '' }}"
+        echo "NPM_TOKEN first 4 chars: ${NPM_TOKEN:0:4}..."
+      env:
+        NPM_TOKEN: ${{ secrets.NPM_TOKEN }}
+    - name: Publish to npm
+      run: npm publish --tag beta
       env:
         NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }}

package/.github/workflows/testdriver.yml ADDED Viewed

@@ -0,0 +1,36 @@
+name: TestDriver.ai Tests
+on:
+  push:
+    branches: [ main, master ]
+  pull_request:
+    branches: [ main, master ]
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v4
+    - name: Setup Node.js
+      uses: actions/setup-node@v4
+      with:
+        node-version: '20'
+        cache: 'npm'
+    - name: Install dependencies
+      run: npm ci
+    - name: Run TestDriver.ai tests
+      env:
+        TD_API_KEY: ${{ secrets.TD_API_KEY }}
+      run: npx vitest run
+    - name: Upload test results
+      if: always()
+      uses: actions/upload-artifact@v4
+      with:
+        name: test-results
+        path: test-results/
+        retention-days: 30

package/agent/index.js CHANGED Viewed

@@ -17,7 +17,6 @@ const diff = require("diff");
 // global utilities
 const generator = require("./lib/generator.js");
-const promptCache = require("./lib/cache.js");
 const theme = require("./lib/theme.js");
 const SourceMapper = require("./lib/source-mapper.js");
@@ -110,6 +109,10 @@ class TestDriverAgent extends EventEmitter2 {
     // Create sandbox instance with this agent's emitter, analytics, and session
     this.sandbox = createSandbox(this.emitter, this.analytics, this.session);
+    // Attach Sentry log listeners to capture CLI logs as breadcrumbs
+      const sentry = require("../lib/sentry");
+      sentry.attachLogListeners(this.emitter);
     // Set the OS for the sandbox to use
     this.sandbox.os = this.sandboxOs;
@@ -191,6 +194,15 @@ class TestDriverAgent extends EventEmitter2 {
       this.redraw.cleanup();
     }
+    // Close sandbox connection to release the connection slot
+    if (this.sandbox) {
+      try {
+        this.sandbox.close();
+      } catch (err) {
+        // Ignore sandbox close errors during exit
+      }
+    }
     shouldRunPostrun =
       !this.hasRunPostrun &&
       (shouldRunPostrun || this.cliArgs?.command == "run");
@@ -356,7 +368,7 @@ class TestDriverAgent extends EventEmitter2 {
           image,
         },
         (chunk) => {
-          if (chunk.type === "data") {
+          if (chunk.type === "data" && chunk.data) {
             this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
           }
         },
@@ -420,9 +432,6 @@ class TestDriverAgent extends EventEmitter2 {
     let mousePosition = await this.system.getMousePosition();
     let activeWindow = await this.system.activeWin();
-    const streamId = `check-${Date.now()}`;
-    this.emitter.emit(events.log.markdown.start, streamId);
     let response = await this.sdk.req(
       "check",
       {
@@ -430,15 +439,10 @@ class TestDriverAgent extends EventEmitter2 {
         images,
         mousePosition,
         activeWindow,
-      },
-      (chunk) => {
-        if (chunk.type === "data") {
-          this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
-        }
-      },
+      }
     );
-    this.emitter.emit(events.log.markdown.end, streamId);
+    this.emitter.emit(events.log.markdown.static, response.data);
     this.lastScreenshot = thisScreenshot;
@@ -869,8 +873,7 @@ commands:
     currentTask,
     dry = false,
     validateAndLoop = false,
-    shouldSave = true,
-    useCache = true,
+    shouldSave = true
   ) {
     // Check if execution has been stopped
     if (this.stopped) {
@@ -889,56 +892,10 @@ commands:
     this.tasks.push(currentTask);
-    // Check cache first (if enabled via parameter)
-    const cachedYaml = useCache ? promptCache.readCache(currentTask) : null;
-    if (cachedYaml) {
-      // Cache hit - load and execute the cached YAML file
-      this.emitter.emit(
-        events.log.debug,
-        `Using cached response for prompt: "${currentTask}"`,
-      );
-      this.emitter.emit(events.log.log, theme.dim("(using cached response)"));
-      try {
-        // Load the YAML using hydrateFromYML
-        const parsed = await generator.hydrateFromYML(
-          cachedYaml,
-          this.sessionInstance,
-        );
-        // Execute the commands from the first step
-        if (parsed.steps && parsed.steps.length > 0) {
-          const step = parsed.steps[0];
-          if (step.commands) {
-            await this.executeCommands(
-              step.commands,
-              0,
-              false,
-              dry,
-              shouldSave,
-            );
-          }
-        }
-      } catch (err) {
-        this.emitter.emit(
-          events.log.debug,
-          `Error loading cached YAML: ${err.message}, falling back to API`,
-        );
-        // Fall through to make API call if cache is invalid
-      }
-      return;
-    }
-    // Cache miss - call the API
     this.emitter.emit(events.log.narration, theme.dim("thinking..."), true);
     this.lastScreenshot = await this.system.captureScreenBase64();
-    const streamId = `input-${Date.now()}`;
-    this.emitter.emit(events.log.markdown.start, streamId);
     let message = await this.sdk.req(
       "input",
       {
@@ -946,59 +903,12 @@ commands:
         mousePosition: await this.system.getMousePosition(),
         activeWindow: await this.system.activeWin(),
         image: this.lastScreenshot,
-      },
-      (chunk) => {
-        if (chunk.type === "data") {
-          this.emitter.emit(events.log.markdown.chunk, streamId, chunk.data);
-        }
-      },
+      }
     );
-    this.emitter.emit(events.log.markdown.end, streamId);
+    this.emitter.emit(events.log.log, message.data);
     if (message && message.data) {
-      // Save the YAML to cache (if enabled)
-      if (useCache) {
-        try {
-          // Extract YAML code blocks from the markdown response
-          const codeblocks = await this.parser.findCodeBlocks(message.data);
-          if (codeblocks && codeblocks.length > 0) {
-            // Parse commands from all code blocks
-            const allCommands = [];
-            for (const block of codeblocks) {
-              const commands = await this.parser.getCommands(block);
-              allCommands.push(...commands);
-            }
-            // Create a proper step with prompt
-            const step = {
-              prompt: currentTask,
-              commands: allCommands,
-            };
-            // Use dumpToYML to create a valid testdriver yaml file
-            const yamlContent = await generator.dumpToYML(
-              [step],
-              this.sessionInstance,
-            );
-            const cachePath = promptCache.writeCache(currentTask, yamlContent);
-            if (cachePath) {
-              this.emitter.emit(
-                events.log.debug,
-                `Cached YAML saved to: ${cachePath}`,
-              );
-            }
-          }
-        } catch (err) {
-          // If we can't extract YAML, just skip caching
-          this.emitter.emit(
-            events.log.debug,
-            `Could not cache response: ${err.message}`,
-          );
-        }
-      }
       await this.aiExecute(message.data, validateAndLoop, dry, shouldSave);
       this.emitter.emit(
         events.log.debug,
@@ -2200,6 +2110,15 @@ Please check your network connection, TD_API_KEY, or the service status.`,
     }
     this.session.set(sessionRes.data.id);
+    // Set Sentry session trace context for distributed tracing
+    // This links CLI errors/logs to the same trace as API calls
+    try {
+      const sentry = require("../lib/sentry");
+      sentry.setSessionTraceContext(sessionRes.data.id);
+    } catch (e) {
+      // Sentry module may not be available, ignore
+    }
   }
   // Helper method to find testdriver directory by traversing up from a file path

package/bin/testdriverai.js CHANGED Viewed

@@ -1,5 +1,8 @@
 #!/usr/bin/env node
+// Initialize Sentry first, before any other modules
+const sentry = require("../lib/sentry");
 // Set process priority if possible
 const os = require("os");
 try {
@@ -10,5 +13,10 @@ try {
   // Ignore if not permitted
 }
+// Ensure Sentry flushes on exit
+process.on("beforeExit", async () => {
+  await sentry.flush();
+});
 // Run the CLI
 require("../interfaces/cli.js");

package/debugger/index.html CHANGED Viewed

@@ -307,9 +307,46 @@
         text-align: center;
         user-select: none;
       }
+      .close-button {
+        position: fixed;
+        top: 12px;
+        right: 12px;
+        z-index: 100;
+        background: rgba(0, 0, 0, 0.8);
+        border: 1px solid #444;
+        color: #fff;
+        padding: 8px 16px;
+        border-radius: 6px;
+        cursor: pointer;
+        font-size: 13px;
+        font-weight: 500;
+        pointer-events: auto;
+        transition: all 0.2s ease;
+        display: flex;
+        align-items: center;
+        gap: 6px;
+      }
+      .close-button:hover {
+        background: rgba(220, 53, 69, 0.9);
+        border-color: #dc3545;
+      }
+      .close-button svg {
+        width: 14px;
+        height: 14px;
+        fill: currentColor;
+      }
     </style>
   </head>
   <body>
+    <!-- Close window button -->
+    <button class="close-button" onclick="window.close()" title="Close this window">
+      <svg viewBox="0 0 24 24"><path d="M19 6.41L17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12z"/></svg>
+      Close
+    </button>
     <!-- Loading screen -->
     <div class="loading-screen" id="loading-screen">
       <div class="testdriver-logo">

package/docs/docs.json CHANGED Viewed

@@ -192,15 +192,8 @@
   "groups": [
     {
       "group": "Getting Started",
-      "icon": "rocket",
-      "pages": [
-        "/v7/getting-started/quickstart"
-      ]
-    },
-    {
-      "group": "Guides",
-      "icon": "book",
       "pages": [
+        "/v7/getting-started/quickstart",
         "/v7/getting-started/writing-tests",
         "/v7/getting-started/running-tests",
         "/v7/getting-started/debugging-tests",
@@ -209,7 +202,6 @@
     },
     {
       "group": "Examples",
-      "icon": "code",
       "pages": [
         "/v7/presets/chrome",
         "/v7/presets/chrome-extension",
@@ -218,8 +210,7 @@
       ]
     },
     {
-      "group": "Features",
-      "icon": "layer-group",
+      "group": "Guides",
       "pages": [
         {
           "group": "Selectorless Testing",

package/docs/v7/_drafts/architecture.mdx CHANGED Viewed

@@ -44,7 +44,6 @@ This system provides comprehensive test execution tracking, linking test runs wi
 │         │                │                                   │
 │         │ • TdTestRun    │                                   │
 │         │ • TdTestCase   │                                   │
-│         │ • TdSandbox    │                                   │
 │         │ • Replay       │                                   │
 │         └────────────────┘                                   │
 │                                                               │
@@ -95,7 +94,6 @@ Represents a complete test suite execution (e.g., `npx vitest run`).
 **Relationships:**
 - `team`: Owner team
-- `sandbox`: TdSandbox where tests ran
 - `testCases`: Collection of TdTestCase
 - `replays`: Associated Replay records
@@ -114,36 +112,13 @@ Represents an individual test within a test run.
 **Relationships:**
 - `testRun`: Parent TdTestRun
-- `replay`: Associated Replay record
-### TdSandbox
-Represents a spawned VM/sandbox instance.
-**Key Fields:**
-- `sandboxId`: Unique identifier
-- `platform`: windows | mac | linux
-- `status`: provisioning | ready | running | stopped | terminated
-- `instanceId`, `instanceType`: AWS EC2 details
-- `ipAddress`, `vncUrl`, `wsUrl`: Connection details
-- `spawnTime`, `readyTime`, `terminateTime`: Lifecycle timestamps
-- `dashcamAuth`: Whether dashcam was authenticated
-- `dashcamProjectId`: Dashcam project for replays
-**Relationships:**
-- `team`: Owner team
-- `user`: User who spawned it
-- `testRuns`: Tests that ran on this sandbox
-- `replays`: Dashcam recordings from this sandbox
-**Note:** Sandbox creation/updates happen via WebSocket (not REST API) as part of the sandbox provisioning flow.
+- `replay`: Associated Replay record
 ### Replay (Extended)
 Existing model extended with test run associations.
 **New Fields:**
 - `tdTestRun`: Associated test run
 - `tdTestCase`: Associated test case
-- `tdSandbox`: Sandbox where recorded
 ## API Endpoints