npm - testdriverai - Versions diffs - 7.8.0 → 7.9.0-test.1 - Mend

testdriverai 7.8.0 → 7.9.0-test.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

package/agent/index.js +12 -0
package/agent/lib/http.js +21 -3
package/agent/lib/logger.js +15 -0
package/agent/lib/provision-commands.js +176 -0
package/agent/lib/sandbox.js +667 -118
package/agent/lib/sdk.js +1 -20
package/ai/skills/testdriver-find/SKILL.md +14 -20
package/docs/_data/examples-manifest.json +46 -46
package/docs/_scripts/extract-example-urls.js +67 -72
package/docs/docs.json +2 -1
package/docs/v7/examples/ai.mdx +1 -1
package/docs/v7/examples/assert.mdx +1 -1
package/docs/v7/examples/captcha-api.mdx +1 -1
package/docs/v7/examples/chrome-extension.mdx +1 -1
package/docs/v7/examples/drag-and-drop.mdx +1 -1
package/docs/v7/examples/element-not-found.mdx +1 -1
package/docs/v7/examples/exec-output.mdx +1 -1
package/docs/v7/examples/exec-pwsh.mdx +1 -1
package/docs/v7/examples/focus-window.mdx +1 -1
package/docs/v7/examples/hover-image.mdx +1 -1
package/docs/v7/examples/hover-text.mdx +1 -1
package/docs/v7/examples/installer.mdx +1 -1
package/docs/v7/examples/launch-vscode-linux.mdx +1 -1
package/docs/v7/examples/match-image.mdx +1 -1
package/docs/v7/examples/press-keys.mdx +1 -1
package/docs/v7/examples/scroll-keyboard.mdx +1 -1
package/docs/v7/examples/scroll-until-image.mdx +1 -1
package/docs/v7/examples/scroll-until-text.mdx +1 -1
package/docs/v7/examples/scroll.mdx +1 -1
package/docs/v7/examples/type.mdx +1 -1
package/docs/v7/examples/windows-installer.mdx +1 -1
package/docs/v7/find.mdx +14 -20
package/docs/v7/test-results-json.mdx +258 -0
package/examples/scroll-keyboard.test.mjs +1 -1
package/examples/scroll.test.mjs +1 -12
package/interfaces/vitest-plugin.mjs +167 -51
package/lib/core/Dashcam.js +16 -22
package/lib/environments.json +8 -4
package/lib/github-comment.mjs +58 -40
package/lib/init-project.js +5 -67
package/lib/resolve-channel.js +39 -10
package/lib/sentry.js +47 -23
package/lib/vitest/hooks.mjs +117 -20
package/manual/exec-stream-logs.test.mjs +25 -0
package/mcp-server/dist/server.mjs +28 -8
package/mcp-server/src/server.ts +31 -8
package/package.json +2 -1
package/sdk.d.ts +4 -0
package/sdk.js +42 -12
package/setup/aws/install-dev-runner.sh +79 -0
package/setup/aws/spawn-runner.sh +165 -0
package/test-sentry-span.js +35 -0
package/vitest.config.mjs +7 -3
package/vitest.runner.config.mjs +33 -0
package/docs/v7/_drafts/core.mdx +0 -458

package/lib/vitest/hooks.mjs CHANGED

@@ -42,14 +42,14 @@ function checkVitestVersion() {
     if (major < MINIMUM_VITEST_VERSION) {
       throw new Error(
         `TestDriver requires Vitest >= ${MINIMUM_VITEST_VERSION}.0.0, but found ${version}. ` +
-          `Please upgrade Vitest: npm install vitest@latest`,
+        `Please upgrade Vitest: npm install vitest@latest`,
       );
     }
   } catch (err) {
     if (err.code === "MODULE_NOT_FOUND") {
       throw new Error(
         "TestDriver requires Vitest to be installed. " +
-          "Please install it: npm install vitest@latest",
+        "Please install it: npm install vitest@latest",
       );
     }
     throw err;
@@ -181,18 +181,33 @@ function setupConsoleSpy(client, taskId) {
 /**
  * Unregister a client so its sandbox no longer receives forwarded logs.
- * When the last client is removed we restore the original console methods so
- * the Vitest worker fork can exit cleanly (unreleased vi.spyOn mocks prevent
- * the worker from shutting down, producing "Worker exited unexpectedly").
- * If another test starts later (e.g. a retry), installConsoleSpy() will
- * re-install the spy on demand.
+ *
+ * Between sequential `it()` blocks we intentionally keep the spies installed.
+ * The `bufferConsoleToClients` function is a no-op when `activeClients` is
+ * empty, so leaving the spy in place is harmless and avoids a non-atomic
+ * restore/re-install race that can corrupt console method references.
+ *
+ * Spies are torn down once at process exit so the Vitest worker fork can
+ * shut down cleanly (unreleased vi.spyOn mocks prevent exit).
+ *
  * @param {import('../../sdk.js').default} client - TestDriver client instance
  */
 function cleanupConsoleSpy(client) {
   _consoleSpy.activeClients.delete(client);
-  // Restore spies when no tests need them — allows clean worker exit
-  if (_consoleSpy.activeClients.size === 0 && _consoleSpy.spies) {
+  if (debugConsoleSpy) {
+    process.stdout.write(
+      `[DEBUG cleanupConsoleSpy] clients remaining: ${_consoleSpy.activeClients.size}\n`,
+    );
+  }
+}
+/**
+ * Tear down the singleton console spy completely.
+ * Called once on process exit so the Vitest worker can shut down cleanly.
+ */
+function teardownConsoleSpy() {
+  if (_consoleSpy.spies) {
     _consoleSpy.spies.log.mockRestore();
     _consoleSpy.spies.error.mockRestore();
     _consoleSpy.spies.warn.mockRestore();
@@ -202,21 +217,26 @@ function cleanupConsoleSpy(client) {
     _consoleSpy.installed = false;
     if (debugConsoleSpy) {
-      process.stdout.write("[DEBUG cleanupConsoleSpy] All spies restored\n");
+      process.stdout.write("[DEBUG teardownConsoleSpy] All spies restored\n");
     }
   }
-  if (debugConsoleSpy) {
-    process.stdout.write(
-      `[DEBUG cleanupConsoleSpy] clients remaining: ${_consoleSpy.activeClients.size}\n`,
-    );
-  }
 }
+// Restore console spies on process exit so the Vitest worker can exit cleanly
+process.on("exit", teardownConsoleSpy);
 // Weak maps to store instances per test context
 const testDriverInstances = new WeakMap();
 const lifecycleHandlers = new WeakMap();
+/**
+ * Module-level promise tracking the most recent test's disconnect.
+ * When sequential `it()` blocks run, the next test awaits this promise
+ * before connecting — ensuring the previous sandbox is fully torn down
+ * even if the cleanup's disconnect timeout fired early.
+ */
+let _pendingDisconnect = null;
 /**
  * Upload buffered SDK + console logs directly to S3 via the existing Log system.
  * Extracts the replayId from the dashcam URL, calls POST /api/v1/logs to create
@@ -403,6 +423,11 @@ export function TestDriver(context, options = {}) {
     config.apiRoot = process.env.TD_API_ROOT;
   }
+  // Use TD_E2B_TEMPLATE_ID from environment if not provided in config
+  if (!config.e2bTemplateId && process.env.TD_E2B_TEMPLATE_ID) {
+    config.e2bTemplateId = process.env.TD_E2B_TEMPLATE_ID;
+  }
   const testdriver = new TestDriverSDK(apiKey, config);
   testdriver.__vitestContext = context.task;
   testdriver._debugOnFailure = mergedOptions.debugOnFailure || false;
@@ -431,6 +456,14 @@ export function TestDriver(context, options = {}) {
   const debugConsoleSpy = process.env.TD_DEBUG_CONSOLE_SPY === "true";
   testdriver.__connectionPromise = (async () => {
+    // Wait for any previous test's disconnect to fully complete.
+    // This prevents the new sandbox connection from racing with a
+    // lingering disconnect when sequential `it()` blocks run.
+    if (_pendingDisconnect) {
+      await _pendingDisconnect.catch(() => {});
+      _pendingDisconnect = null;
+    }
     if (debugConsoleSpy) {
       console.log(
         "[DEBUG] Before auth - sandbox.instanceSocketConnected:",
@@ -644,15 +677,79 @@ export function TestDriver(context, options = {}) {
       // Clean up console spies
       cleanupConsoleSpy(currentInstance);
+      // Build test result metadata for JSON report output
+      {
+        const sdkPkg = require("../../package.json");
+        const inst = currentInstance.getInstance?.() || {};
+        const sbx = currentInstance.sandbox || {};
+        const apiRoot = currentInstance.config?.TD_API_ROOT || null;
+        context.task.meta.testResult = {
+          // Versions
+          sdkVersion: sdkPkg.version || null,
+          apiVersion: currentInstance._apiVersion || null,
+          runnerVersionBefore: inst.runnerVersionBefore || null,
+          runnerVersionAfter: inst.runnerVersionAfter || null,
+          wasUpdated: inst.wasUpdated || false,
+          // URLs
+          apiUrl: apiRoot,
+          vncUrl: inst.vncUrl || inst.url || null,
+          // Dates
+          date: new Date().toISOString(),
+          // Team / session
+          teamId: sbx._teamId || null,
+          sessionId: currentInstance.getSessionId?.() || null,
+          // Test info
+          testFile: context.task.meta.testFile || null,
+          testName: context.task.name || null,
+          suiteName: context.task.suite?.name || null,
+          // Test result
+          testPassed: context.task.result?.state === "pass",
+          error: context.task.result?.errors?.[0]?.message || null,
+          errorStack: context.task.result?.errors?.[0]?.stack || null,
+          // Infrastructure
+          sandboxId: inst.sandboxId || inst.instanceId || null,
+          instanceId: inst.instanceId || null,
+          os: currentInstance.os || inst.os || null,
+          amiId: inst.amiId || null,
+          e2bTemplateId: inst.e2bTemplateId || null,
+          imageVersion: inst.imageVersion || null,
+          // Realtime
+          realtimeChannel: inst.channelName || sbx._channelName || null,
+          realtimeMessageCount: typeof sbx.getPublishCount === "function" ? sbx.getPublishCount() : 0,
+          // Interactions
+          interactions: currentInstance._interactionStats
+            ? { ...currentInstance._interactionStats, byType: { ...currentInstance._interactionStats.byType } }
+            : { total: 0, cached: 0, byType: {} },
+        };
+      }
       // Wait for connection to finish if it was initiated
       if (currentInstance.__connectionPromise) {
-        await currentInstance.__connectionPromise.catch(() => {}); // Ignore connection errors during cleanup
+        await currentInstance.__connectionPromise.catch(() => { }); // Ignore connection errors during cleanup
       }
-      // Disconnect with timeout
+      // Disconnect — track the promise at module level so the *next* test
+      // can await it before connecting, even if the timeout fires first.
+      const disconnectPromise = currentInstance.disconnect().catch((err) => {
+        console.error("Error during disconnect:", err);
+      });
+      _pendingDisconnect = disconnectPromise;
+      // Allow up to 30 s for Ably presence leave / channel detach.
+      // If it takes longer, cleanup resolves but _pendingDisconnect
+      // keeps the reference so the next test still waits.
       await Promise.race([
-        currentInstance.disconnect(),
-        new Promise((resolve) => setTimeout(resolve, 5000)), // 5s timeout for disconnect
+        disconnectPromise,
+        new Promise((resolve) => setTimeout(resolve, 30000)),
       ]);
     } catch (error) {
       console.error("Error disconnecting client:", error);

package/manual/exec-stream-logs.test.mjs ADDED

@@ -0,0 +1,25 @@
+import { describe, expect, it } from "vitest";
+import { TestDriver } from "../lib/vitest/hooks.mjs";
+import { getDefaults } from "../examples/config.mjs";
+describe("Exec Log Streaming", () => {
+  it("should stream exec logs every second for 20 seconds", async (context) => {
+    const testdriver = TestDriver(context, { ...getDefaults(context), headless: true });
+    await testdriver.provision.chrome({ url: "about:blank" });
+    const code = `for i in $(seq 1 20); do echo "log line $i at $(date +%T)"; sleep 1; done`;
+    const result = await testdriver.exec({
+      language: "sh",
+      code,
+      timeout: 30000,
+    });
+    console.log("exec result:", result);
+    // Verify we got all 20 log lines
+    for (let i = 1; i <= 20; i++) {
+      expect(result).toContain(`log line ${i}`);
+    }
+  });
+});

package/mcp-server/dist/server.mjs CHANGED

@@ -26,18 +26,33 @@ import { sessionManager } from "./session.js";
 const sdkRoot = path.join(path.dirname(fileURLToPath(import.meta.url)), "..", "..");
 const packageJson = JSON.parse(fs.readFileSync(path.join(sdkRoot, "package.json"), "utf-8"));
 const version = packageJson.version || "1.0.0";
-// Derive release channel from package version prerelease tag (e.g. "7.6.0-test.5" → "test")
+// Derive release channel and infrastructure environment from package version
 import semver from "semver";
-const KNOWN_CHANNELS = new Set(["dev", "test", "canary", "latest"]);
-function resolveReleaseChannel(ver) {
-    if (process.env.TD_CHANNEL && KNOWN_CHANNELS.has(process.env.TD_CHANNEL))
+const CHANNEL_TO_ENV = {
+    dev: "dev",
+    test: "staging",
+    canary: "production",
+    stable: "production",
+};
+const VALID_CHANNELS = new Set(Object.keys(CHANNEL_TO_ENV));
+const VALID_ENVS = new Set(["dev", "staging", "production"]);
+function resolveChannel(ver) {
+    if (process.env.TD_CHANNEL && VALID_CHANNELS.has(process.env.TD_CHANNEL))
         return process.env.TD_CHANNEL;
+    if (process.env.TD_ENV && VALID_CHANNELS.has(process.env.TD_ENV))
+        return process.env.TD_ENV;
     const pre = semver.prerelease(ver);
-    if (pre && pre.length > 0 && KNOWN_CHANNELS.has(String(pre[0])))
+    if (pre && pre.length > 0 && VALID_CHANNELS.has(String(pre[0])))
         return String(pre[0]);
-    return "latest";
+    return "stable";
+}
+function resolveSentryEnvironment(ver) {
+    if (process.env.TD_ENV && VALID_ENVS.has(process.env.TD_ENV))
+        return process.env.TD_ENV;
+    return CHANNEL_TO_ENV[resolveChannel(ver)] || "production";
 }
-const releaseChannel = resolveReleaseChannel(version);
+const activeChannel = resolveChannel(version);
+const sentryEnvironment = resolveSentryEnvironment(version);
 const isSentryEnabled = () => {
     if (process.env.TD_TELEMETRY === "false") {
         return false;
@@ -49,7 +64,7 @@ if (isSentryEnabled()) {
     Sentry.init({
         dsn: process.env.SENTRY_DSN ||
             "https://452bd5a00dbd83a38ee8813e11c57694@o4510262629236736.ingest.us.sentry.io/4510480443637760",
-        environment: releaseChannel,
+        environment: sentryEnvironment,
         release: version,
         sampleRate: 1.0,
         tracesSampleRate: 1.0,
@@ -57,6 +72,7 @@ if (isSentryEnabled()) {
         integrations: [Sentry.httpIntegration(), Sentry.nodeContextIntegration()],
         initialScope: {
             tags: {
+                channel: activeChannel,
                 platform: os.platform(),
                 arch: os.arch(),
                 nodeVersion: process.version,
@@ -84,6 +100,10 @@ if (isSentryEnabled()) {
             if (error && typeof error === "object" && "name" in error && error.name === "TestFailure") {
                 return null;
             }
+            // Filter out ElementNotFoundError - expected test outcome, not a crash
+            if (error && typeof error === "object" && "name" in error && error.name === "ElementNotFoundError") {
+                return null;
+            }
             return event;
         },
     });

package/mcp-server/src/server.ts CHANGED

@@ -34,16 +34,33 @@ const sdkRoot = path.join(path.dirname(fileURLToPath(import.meta.url)), "..", ".
 const packageJson = JSON.parse(fs.readFileSync(path.join(sdkRoot, "package.json"), "utf-8"));
 const version = packageJson.version || "1.0.0";
-// Derive release channel from package version prerelease tag (e.g. "7.6.0-test.5" → "test")
+// Derive release channel and infrastructure environment from package version
 import semver from "semver";
-const KNOWN_CHANNELS = new Set(["dev", "test", "canary", "latest"]);
-function resolveReleaseChannel(ver: string): string {
-  if (process.env.TD_CHANNEL && KNOWN_CHANNELS.has(process.env.TD_CHANNEL)) return process.env.TD_CHANNEL;
+const CHANNEL_TO_ENV: Record<string, string> = {
+  dev: "dev",
+  test: "staging",
+  canary: "production",
+  stable: "production",
+};
+const VALID_CHANNELS = new Set(Object.keys(CHANNEL_TO_ENV));
+const VALID_ENVS = new Set(["dev", "staging", "production"]);
+function resolveChannel(ver: string): string {
+  if (process.env.TD_CHANNEL && VALID_CHANNELS.has(process.env.TD_CHANNEL)) return process.env.TD_CHANNEL;
+  if (process.env.TD_ENV && VALID_CHANNELS.has(process.env.TD_ENV)) return process.env.TD_ENV;
   const pre = semver.prerelease(ver);
-  if (pre && pre.length > 0 && KNOWN_CHANNELS.has(String(pre[0]))) return String(pre[0]);
-  return "latest";
+  if (pre && pre.length > 0 && VALID_CHANNELS.has(String(pre[0]))) return String(pre[0]);
+  return "stable";
+}
+function resolveSentryEnvironment(ver: string): string {
+  if (process.env.TD_ENV && VALID_ENVS.has(process.env.TD_ENV)) return process.env.TD_ENV;
+  return CHANNEL_TO_ENV[resolveChannel(ver)] || "production";
 }
-const releaseChannel = resolveReleaseChannel(version);
+const activeChannel = resolveChannel(version);
+const sentryEnvironment = resolveSentryEnvironment(version);
 const isSentryEnabled = () => {
   if (process.env.TD_TELEMETRY === "false") {
@@ -58,7 +75,7 @@ if (isSentryEnabled()) {
     dsn:
       process.env.SENTRY_DSN ||
       "https://452bd5a00dbd83a38ee8813e11c57694@o4510262629236736.ingest.us.sentry.io/4510480443637760",
-    environment: releaseChannel,
+    environment: sentryEnvironment,
     release: version,
     sampleRate: 1.0,
     tracesSampleRate: 1.0,
@@ -66,6 +83,7 @@ if (isSentryEnabled()) {
     integrations: [Sentry.httpIntegration(), Sentry.nodeContextIntegration()],
     initialScope: {
       tags: {
+        channel: activeChannel,
         platform: os.platform(),
         arch: os.arch(),
         nodeVersion: process.version,
@@ -99,6 +117,11 @@ if (isSentryEnabled()) {
       if (error && typeof error === "object" && "name" in error && (error as { name: string }).name === "TestFailure") {
         return null;
       }
+      // Filter out ElementNotFoundError - expected test outcome, not a crash
+      if (error && typeof error === "object" && "name" in error && (error as { name: string }).name === "ElementNotFoundError") {
+        return null;
+      }
       return event;
     },

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "testdriverai",
-  "version": "7.8.0",
+  "version": "7.9.0-test.1",
   "description": "Next generation autonomous AI agent for end-to-end testing of web & desktop",
   "main": "sdk.js",
   "types": "sdk.d.ts",
@@ -116,6 +116,7 @@
   },
   "overrides": {
     "glob": "^11.0.1",
+    "obug": "2.1.1",
     "rimraf": "^5.0.10"
   },
   "peerDependencies": {

package/sdk.d.ts CHANGED

@@ -273,6 +273,8 @@ export interface TestDriverOptions {
   sandboxAmi?: string;
   /** EC2 instance type for sandbox (e.g., 'i3.metal') */
   sandboxInstance?: string;
+  /** E2B template ID to use when creating the sandbox (e.g., 'my-template-id') */
+  e2bTemplateId?: string;
   /** Cache key for element finding operations. If provided, enables caching tied to this key */
   cacheKey?: string;
   /** Reconnect to the last used sandbox instead of creating a new one. When true, provision methods (chrome, vscode, installer, etc.) will be skipped since the application is already running. Throws error if no previous sandbox exists. */
@@ -327,6 +329,8 @@ export interface ConnectOptions {
   sandboxAmi?: string;
   /** EC2 instance type for sandbox (e.g., 'i3.metal') */
   sandboxInstance?: string;
+  /** E2B template ID to use when creating the sandbox (e.g., 'my-template-id') */
+  e2bTemplateId?: string;
   /** Operating system for the sandbox (default: 'linux') */
   os?: "windows" | "linux";
   /**

package/sdk.js CHANGED

@@ -481,7 +481,7 @@ class Element {
       let cacheKey = null;
       let cacheThreshold = null;
       let perCommandThresholds = null; // Per-command { screen, element } override
-      let zoom = false; // Default to disabled, enable with zoom: true
+      let zoom = true; // Default to enabled
       let perCommandAi = null; // Per-command AI config override
       let minConfidence = null; // Minimum confidence threshold
@@ -494,8 +494,8 @@ class Element {
         // New: options is an object with cacheKey and/or cacheThreshold
         cacheKey = options.cacheKey || null;
         cacheThreshold = options.cacheThreshold ?? null;
-        // zoom defaults to false unless explicitly set to true
-        zoom = options.zoom === true;
+        // zoom defaults to true unless explicitly set to false
+        zoom = options.zoom !== false;
         // Minimum confidence threshold: fail find if AI confidence is below this value
         minConfidence = options.confidence ?? null;
         // Element type hint for prompt wrapping
@@ -568,7 +568,7 @@ class Element {
         cacheKey: cacheKey,
         os: this.sdk.os,
         resolution: this.sdk.resolution,
-        zoom: zoom,
+        zoom: zoom === true ? 1 : zoom === false ? 0 : zoom,
         confidence: minConfidence,
         type: elementType,
         ai: {
@@ -623,6 +623,11 @@ class Element {
     // Track find interaction once at the end (fire-and-forget, don't block)
     const sessionId = this.sdk.getSessionId();
+    const findCacheHit = response?.cacheHit || response?.cache_hit || response?.cached || false;
+    // Increment local interaction counters
+    this.sdk._interactionStats.total++;
+    this.sdk._interactionStats.byType.find = (this.sdk._interactionStats.byType.find || 0) + 1;
+    if (findCacheHit) this.sdk._interactionStats.cached++;
     if (sessionId && this.sdk.apiClient) {
       this.sdk.apiClient
         .req("interaction/track", {
@@ -632,11 +637,7 @@ class Element {
           timestamp: absoluteTimestamp, // Absolute epoch timestamp - frontend calculates relative using clientStartDate
           success: this._found,
           error: findError,
-          cacheHit:
-            response?.cacheHit ||
-            response?.cache_hit ||
-            response?.cached ||
-            false,
+          cacheHit: findCacheHit,
           selector: response?.selector,
           selectorUsed: !!response?.selector,
           confidence: response?.confidence ?? null,
@@ -1498,6 +1499,7 @@ class TestDriverSDK {
     // Store sandbox configuration options
     this.sandboxAmi = options.sandboxAmi || null;
     this.sandboxInstance = options.sandboxInstance || null;
+    this.e2bTemplateId = options.e2bTemplateId || null;
     // Store reconnect preference from options
     this.reconnect =
@@ -1616,6 +1618,12 @@ class TestDriverSDK {
     // Uploaded to S3 at cleanup so they can be displayed alongside dashcam replays.
     this._logBuffer = [];
+    // API version discovered by _logEnvironmentInfo()
+    this._apiVersion = null;
+    // Local interaction counters — incremented at each interaction/track call site
+    this._interactionStats = { total: 0, cached: 0, byType: {} };
     // Set up event listeners once (they live for the lifetime of the SDK instance)
     this._setupLogging();
@@ -2716,6 +2724,7 @@ CAPTCHA_SOLVER_EOF`,
    * @param {string} options.ip - Direct IP address to connect to
    * @param {string} options.sandboxAmi - AMI to use for the sandbox
    * @param {string} options.sandboxInstance - Instance type for the sandbox
+   * @param {string} options.e2bTemplateId - E2B template ID to use when creating the sandbox
    * @param {string} options.os - Operating system for the sandbox (windows or linux)
    * @param {boolean} options.reuseConnection - Reuse recent connection if available (default: true)
    * @returns {Promise<Object>} Sandbox instance details
@@ -2804,6 +2813,12 @@ CAPTCHA_SOLVER_EOF`,
     } else if (this.sandboxInstance) {
       this.agent.sandboxInstance = this.sandboxInstance;
     }
+    // Use e2bTemplateId from connectOptions if provided, otherwise fall back to constructor value
+    if (connectOptions.e2bTemplateId !== undefined) {
+      this.agent.e2bTemplateId = connectOptions.e2bTemplateId;
+    } else if (this.e2bTemplateId) {
+      this.agent.e2bTemplateId = this.e2bTemplateId;
+    }
     // Use os from connectOptions if provided, otherwise fall back to this.os
     if (connectOptions.os !== undefined) {
       this.agent.sandboxOs = connectOptions.os;
@@ -3193,6 +3208,11 @@ CAPTCHA_SOLVER_EOF`,
         // Track successful findAll interaction (fire-and-forget, don't block)
         const sessionId = this.getSessionId();
+        const findAllCacheHit = response.cached || false;
+        // Increment local interaction counters
+        this._interactionStats.total++;
+        this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
+        if (findAllCacheHit) this._interactionStats.cached++;
         if (sessionId && this.apiClient) {
           this.apiClient
             .req("interaction/track", {
@@ -3202,7 +3222,7 @@ CAPTCHA_SOLVER_EOF`,
               timestamp: absoluteTimestamp, // Absolute epoch timestamp - frontend calculates relative using clientStartDate
               success: true,
               input: { count: elements.length },
-              cacheHit: response.cached || false,
+              cacheHit: findAllCacheHit,
               selector: response.selector,
               selectorUsed: !!response.selector,
               screenshotUrl: response.screenshotKey ?? null,
@@ -3248,6 +3268,11 @@ CAPTCHA_SOLVER_EOF`,
         // No elements found - track interaction (fire-and-forget, don't block)
         const sessionId = this.getSessionId();
+        const noResultCacheHit = response?.cached || false;
+        // Increment local interaction counters
+        this._interactionStats.total++;
+        this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
+        if (noResultCacheHit) this._interactionStats.cached++;
         if (sessionId && this.apiClient) {
           this.apiClient
             .req("interaction/track", {
@@ -3258,7 +3283,7 @@ CAPTCHA_SOLVER_EOF`,
               success: false,
               error: "No elements found",
               input: { count: 0 },
-              cacheHit: response?.cached || false,
+              cacheHit: noResultCacheHit,
               selector: response?.selector,
               selectorUsed: !!response?.selector,
               screenshotUrl: response?.screenshotKey ?? null,
@@ -3292,6 +3317,9 @@ CAPTCHA_SOLVER_EOF`,
       // Track findAll error interaction (fire-and-forget, don't block)
       const sessionId = this.getSessionId();
+      // Increment local interaction counters
+      this._interactionStats.total++;
+      this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
       if (sessionId && this.apiClient) {
         this.apiClient
           .req("interaction/track", {
@@ -3817,7 +3845,7 @@ CAPTCHA_SOLVER_EOF`,
     const apiRoot = this.config?.TD_API_ROOT || 'unknown';
     const apiKey = this.config?.TD_API_KEY || '';
     const maskedKey = apiKey.length > 4 ? '***' + apiKey.slice(-4) : '(not set)';
-    const env = process.env.TD_ENV || 'unknown';
+    const env = process.env.TD_CHANNEL || process.env.TD_ENV || 'unknown';
     const os = this.agent?.options?.os || process.env.TD_OS || 'linux';
     const sdkVersion = require('./package.json').version;
@@ -3843,6 +3871,8 @@ CAPTCHA_SOLVER_EOF`,
       res.on('end', () => {
         try {
           const info = JSON.parse(data);
+          // Persist API version for test result metadata
+          this._apiVersion = info.version || null;
           const commit = info.commit || 'unknown';
           const shortCommit = commit.substring(0, 7);
           const commitUrl = commit !== 'unknown'

package/setup/aws/install-dev-runner.sh ADDED

@@ -0,0 +1,79 @@
+#!/usr/bin/env bash
+set -euo pipefail
+# Usage: ./install-dev-runner.sh <instance-id>
+INSTANCE_ID="${1:?Usage: $0 <instance-id>}"
+AWS_REGION="${AWS_REGION:-us-east-2}"
+RUNNER_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../../../runner" && pwd)"
+echo "Packing local runner..."
+TMPDIR=$(mktemp -d)
+pushd "$RUNNER_DIR" > /dev/null
+npm pack --pack-destination "$TMPDIR" > /dev/null 2>&1
+TARBALL=$(ls "$TMPDIR"/*.tgz)
+popd > /dev/null
+echo "Tarball: $TARBALL"
+echo "Uploading to S3..."
+S3_KEY="runner-dev/$(date +%s)-$(openssl rand -hex 4)/runner.tgz"
+aws s3 cp "$TARBALL" "s3://v7-transfer/${S3_KEY}" --region "$AWS_REGION" > /dev/null
+DOWNLOAD_URL=$(aws s3 presign "s3://v7-transfer/${S3_KEY}" --expires-in 900 --region "$AWS_REGION")
+rm -rf "$TMPDIR"
+echo "Creating SSM params file..."
+# Write Python script to temp file to generate valid JSON
+PYTHON_SCRIPT=$(mktemp --suffix=.py)
+cat > "$PYTHON_SCRIPT" << 'PYEOF'
+import json
+import sys
+url = sys.argv[1]
+commands = [
+    "Write-Host '=== Stopping runner ==='",
+    "Stop-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
+    "Stop-Process -Name node -Force -ErrorAction SilentlyContinue",
+    "Start-Sleep -Seconds 2",
+    "Set-Location 'C:\\testdriver\\sandbox-agent'",
+    "$tarball = 'C:\\Windows\\Temp\\runner-dev.tgz'",
+    f"Invoke-WebRequest -Uri '{url}' -OutFile $tarball",
+    "Write-Host 'Tarball size:'; (Get-Item $tarball).Length",
+    "Remove-Item -Path lib -Recurse -Force -ErrorAction SilentlyContinue",
+    "tar -xzf $tarball --strip-components=1 -C .",
+    "Get-Content 'package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
+    "Write-Host '=== Starting runner ==='",
+    "Start-ScheduledTask -TaskName RunTestDriverAgent",
+    "Start-Sleep -Seconds 3",
+    "Get-Content 'C:\\testdriver\\log.txt' -Tail 20"
+]
+params = {"commands": commands}
+print(json.dumps(params))
+PYEOF
+python3 "$PYTHON_SCRIPT" "$DOWNLOAD_URL" > /tmp/ssm-install-params.json
+rm "$PYTHON_SCRIPT"
+echo "Sending SSM command..."
+CMD_JSON=$(aws ssm send-command \
+  --region "$AWS_REGION" \
+  --instance-ids "$INSTANCE_ID" \
+  --document-name "AWS-RunPowerShellScript" \
+  --parameters "file:///tmp/ssm-install-params.json" \
+  --output json)
+COMMAND_ID=$(echo "$CMD_JSON" | jq -r '.Command.CommandId')
+echo "Command ID: $COMMAND_ID"
+echo "Waiting for completion..."
+aws ssm wait command-executed --region "$AWS_REGION" --command-id "$COMMAND_ID" --instance-id "$INSTANCE_ID" || true
+echo "Getting output..."
+aws ssm get-command-invocation \
+  --region "$AWS_REGION" \
+  --command-id "$COMMAND_ID" \
+  --instance-id "$INSTANCE_ID" \
+  --query 'StandardOutputContent' \
+  --output text