testdriverai 7.8.0-test.7 → 7.8.0-test.71

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (98) hide show
  1. package/agent/index.js +18 -5
  2. package/agent/lib/commands.js +3 -2
  3. package/agent/lib/http.js +162 -0
  4. package/agent/lib/logger.js +15 -0
  5. package/agent/lib/sandbox.js +554 -209
  6. package/agent/lib/sdk.js +5 -22
  7. package/agent/lib/system.js +25 -65
  8. package/ai/skills/testdriver-cache/SKILL.md +221 -0
  9. package/ai/skills/testdriver-errors/SKILL.md +246 -0
  10. package/ai/skills/testdriver-events/SKILL.md +356 -0
  11. package/ai/skills/testdriver-find/SKILL.md +14 -20
  12. package/ai/skills/testdriver-mcp/SKILL.md +7 -0
  13. package/ai/skills/testdriver-provision/SKILL.md +331 -0
  14. package/ai/skills/testdriver-redraw/SKILL.md +214 -0
  15. package/ai/skills/testdriver-running-tests/SKILL.md +1 -1
  16. package/ai/skills/testdriver-screenshots/SKILL.md +184 -0
  17. package/docs/_data/examples-manifest.json +46 -46
  18. package/docs/_scripts/extract-example-urls.js +67 -72
  19. package/docs/changelog.mdx +148 -8
  20. package/docs/docs.json +46 -38
  21. package/docs/images/content/vscode/v7-chat.png +0 -0
  22. package/docs/images/content/vscode/v7-choose-agent.png +0 -0
  23. package/docs/images/content/vscode/v7-full.png +0 -0
  24. package/docs/images/content/vscode/v7-onboarding.png +0 -0
  25. package/docs/v7/cache.mdx +223 -0
  26. package/docs/v7/copilot/auto-healing.mdx +265 -0
  27. package/docs/v7/copilot/creating-tests.mdx +156 -0
  28. package/docs/v7/copilot/github.mdx +143 -0
  29. package/docs/v7/copilot/running-tests.mdx +149 -0
  30. package/docs/v7/copilot/setup.mdx +143 -0
  31. package/docs/v7/enterprise.mdx +3 -110
  32. package/docs/v7/errors.mdx +248 -0
  33. package/docs/v7/events.mdx +358 -0
  34. package/docs/v7/examples/ai.mdx +1 -1
  35. package/docs/v7/examples/assert.mdx +1 -1
  36. package/docs/v7/examples/captcha-api.mdx +1 -1
  37. package/docs/v7/examples/chrome-extension.mdx +1 -1
  38. package/docs/v7/examples/drag-and-drop.mdx +1 -1
  39. package/docs/v7/examples/element-not-found.mdx +1 -1
  40. package/docs/v7/examples/exec-output.mdx +85 -0
  41. package/docs/v7/examples/exec-pwsh.mdx +83 -0
  42. package/docs/v7/examples/focus-window.mdx +62 -0
  43. package/docs/v7/examples/hover-image.mdx +1 -1
  44. package/docs/v7/examples/hover-text.mdx +1 -1
  45. package/docs/v7/examples/installer.mdx +1 -1
  46. package/docs/v7/examples/launch-vscode-linux.mdx +1 -1
  47. package/docs/v7/examples/match-image.mdx +1 -1
  48. package/docs/v7/examples/press-keys.mdx +1 -1
  49. package/docs/v7/examples/scroll-keyboard.mdx +1 -1
  50. package/docs/v7/examples/scroll-until-image.mdx +1 -1
  51. package/docs/v7/examples/scroll-until-text.mdx +1 -1
  52. package/docs/v7/examples/scroll.mdx +1 -1
  53. package/docs/v7/examples/type.mdx +1 -1
  54. package/docs/v7/examples/windows-installer.mdx +1 -1
  55. package/docs/v7/find.mdx +14 -20
  56. package/docs/v7/{cloud.mdx → hosted.mdx} +43 -5
  57. package/docs/v7/mcp.mdx +9 -0
  58. package/docs/v7/provision.mdx +333 -0
  59. package/docs/v7/quickstart.mdx +30 -2
  60. package/docs/v7/redraw.mdx +216 -0
  61. package/docs/v7/running-tests.mdx +1 -1
  62. package/docs/v7/screenshots.mdx +186 -0
  63. package/docs/v7/self-hosted.mdx +127 -44
  64. package/docs/v7/test-results-json.mdx +258 -0
  65. package/examples/scroll-keyboard.test.mjs +1 -1
  66. package/examples/scroll.test.mjs +1 -12
  67. package/interfaces/logger.js +0 -12
  68. package/interfaces/vitest-plugin.mjs +170 -51
  69. package/lib/core/Dashcam.js +30 -23
  70. package/lib/environments.json +22 -0
  71. package/lib/github-comment.mjs +58 -40
  72. package/lib/init-project.js +5 -67
  73. package/lib/resolve-channel.js +42 -12
  74. package/lib/sentry.js +47 -23
  75. package/lib/vitest/hooks.mjs +63 -3
  76. package/{examples → manual}/drag-and-drop.test.mjs +1 -1
  77. package/manual/exec-stream-logs.test.mjs +25 -0
  78. package/mcp-server/dist/server.mjs +28 -8
  79. package/mcp-server/src/server.ts +31 -8
  80. package/package.json +4 -3
  81. package/sdk.d.ts +4 -0
  82. package/sdk.js +45 -15
  83. package/setup/aws/install-dev-runner.sh +79 -0
  84. package/setup/aws/spawn-runner.sh +165 -0
  85. package/test-sentry-span.js +35 -0
  86. package/vitest.config.mjs +22 -34
  87. package/vitest.runner.config.mjs +33 -0
  88. /package/{examples → manual}/flake-diffthreshold-001.test.mjs +0 -0
  89. /package/{examples → manual}/flake-diffthreshold-01.test.mjs +0 -0
  90. /package/{examples → manual}/flake-diffthreshold-05.test.mjs +0 -0
  91. /package/{examples → manual}/flake-noredraw-cache.test.mjs +0 -0
  92. /package/{examples → manual}/flake-noredraw-nocache.test.mjs +0 -0
  93. /package/{examples → manual}/flake-redraw-cache.test.mjs +0 -0
  94. /package/{examples → manual}/flake-redraw-nocache.test.mjs +0 -0
  95. /package/{examples → manual}/flake-rocket-match.test.mjs +0 -0
  96. /package/{examples → manual}/flake-shared.mjs +0 -0
  97. /package/{examples → manual}/no-provision.test.mjs +0 -0
  98. /package/{examples → manual}/scroll-until-text.test.mjs +0 -0
@@ -46,7 +46,7 @@ describe("Drag and Drop Test", () => {
46
46
 
47
47
  const recycleBin = await testdriver.find(
48
48
  "Recycle Bin, recycle bin icon in the top left corner of the desktop",
49
- );
49
+ ).hover();
50
50
  await recycleBin.mouseUp();
51
51
 
52
52
  // Assert "New Text Document" icon is not on the Desktop
@@ -0,0 +1,25 @@
1
+ import { describe, expect, it } from "vitest";
2
+ import { TestDriver } from "../lib/vitest/hooks.mjs";
3
+ import { getDefaults } from "../examples/config.mjs";
4
+
5
+ describe("Exec Log Streaming", () => {
6
+ it("should stream exec logs every second for 20 seconds", async (context) => {
7
+ const testdriver = TestDriver(context, { ...getDefaults(context), headless: true });
8
+ await testdriver.provision.chrome({ url: "about:blank" });
9
+
10
+ const code = `for i in $(seq 1 20); do echo "log line $i at $(date +%T)"; sleep 1; done`;
11
+
12
+ const result = await testdriver.exec({
13
+ language: "sh",
14
+ code,
15
+ timeout: 30000,
16
+ });
17
+
18
+ console.log("exec result:", result);
19
+
20
+ // Verify we got all 20 log lines
21
+ for (let i = 1; i <= 20; i++) {
22
+ expect(result).toContain(`log line ${i}`);
23
+ }
24
+ });
25
+ });
@@ -26,18 +26,33 @@ import { sessionManager } from "./session.js";
26
26
  const sdkRoot = path.join(path.dirname(fileURLToPath(import.meta.url)), "..", "..");
27
27
  const packageJson = JSON.parse(fs.readFileSync(path.join(sdkRoot, "package.json"), "utf-8"));
28
28
  const version = packageJson.version || "1.0.0";
29
- // Derive release channel from package version prerelease tag (e.g. "7.6.0-test.5" → "test")
29
+ // Derive release channel and infrastructure environment from package version
30
30
  import semver from "semver";
31
- const KNOWN_CHANNELS = new Set(["dev", "test", "canary", "latest"]);
32
- function resolveReleaseChannel(ver) {
33
- if (process.env.TD_CHANNEL && KNOWN_CHANNELS.has(process.env.TD_CHANNEL))
31
+ const CHANNEL_TO_ENV = {
32
+ dev: "dev",
33
+ test: "staging",
34
+ canary: "production",
35
+ stable: "production",
36
+ };
37
+ const VALID_CHANNELS = new Set(Object.keys(CHANNEL_TO_ENV));
38
+ const VALID_ENVS = new Set(["dev", "staging", "production"]);
39
+ function resolveChannel(ver) {
40
+ if (process.env.TD_CHANNEL && VALID_CHANNELS.has(process.env.TD_CHANNEL))
34
41
  return process.env.TD_CHANNEL;
42
+ if (process.env.TD_ENV && VALID_CHANNELS.has(process.env.TD_ENV))
43
+ return process.env.TD_ENV;
35
44
  const pre = semver.prerelease(ver);
36
- if (pre && pre.length > 0 && KNOWN_CHANNELS.has(String(pre[0])))
45
+ if (pre && pre.length > 0 && VALID_CHANNELS.has(String(pre[0])))
37
46
  return String(pre[0]);
38
- return "latest";
47
+ return "stable";
48
+ }
49
+ function resolveSentryEnvironment(ver) {
50
+ if (process.env.TD_ENV && VALID_ENVS.has(process.env.TD_ENV))
51
+ return process.env.TD_ENV;
52
+ return CHANNEL_TO_ENV[resolveChannel(ver)] || "production";
39
53
  }
40
- const releaseChannel = resolveReleaseChannel(version);
54
+ const activeChannel = resolveChannel(version);
55
+ const sentryEnvironment = resolveSentryEnvironment(version);
41
56
  const isSentryEnabled = () => {
42
57
  if (process.env.TD_TELEMETRY === "false") {
43
58
  return false;
@@ -49,7 +64,7 @@ if (isSentryEnabled()) {
49
64
  Sentry.init({
50
65
  dsn: process.env.SENTRY_DSN ||
51
66
  "https://452bd5a00dbd83a38ee8813e11c57694@o4510262629236736.ingest.us.sentry.io/4510480443637760",
52
- environment: releaseChannel,
67
+ environment: sentryEnvironment,
53
68
  release: version,
54
69
  sampleRate: 1.0,
55
70
  tracesSampleRate: 1.0,
@@ -57,6 +72,7 @@ if (isSentryEnabled()) {
57
72
  integrations: [Sentry.httpIntegration(), Sentry.nodeContextIntegration()],
58
73
  initialScope: {
59
74
  tags: {
75
+ channel: activeChannel,
60
76
  platform: os.platform(),
61
77
  arch: os.arch(),
62
78
  nodeVersion: process.version,
@@ -84,6 +100,10 @@ if (isSentryEnabled()) {
84
100
  if (error && typeof error === "object" && "name" in error && error.name === "TestFailure") {
85
101
  return null;
86
102
  }
103
+ // Filter out ElementNotFoundError - expected test outcome, not a crash
104
+ if (error && typeof error === "object" && "name" in error && error.name === "ElementNotFoundError") {
105
+ return null;
106
+ }
87
107
  return event;
88
108
  },
89
109
  });
@@ -34,16 +34,33 @@ const sdkRoot = path.join(path.dirname(fileURLToPath(import.meta.url)), "..", ".
34
34
  const packageJson = JSON.parse(fs.readFileSync(path.join(sdkRoot, "package.json"), "utf-8"));
35
35
  const version = packageJson.version || "1.0.0";
36
36
 
37
- // Derive release channel from package version prerelease tag (e.g. "7.6.0-test.5" → "test")
37
+ // Derive release channel and infrastructure environment from package version
38
38
  import semver from "semver";
39
- const KNOWN_CHANNELS = new Set(["dev", "test", "canary", "latest"]);
40
- function resolveReleaseChannel(ver: string): string {
41
- if (process.env.TD_CHANNEL && KNOWN_CHANNELS.has(process.env.TD_CHANNEL)) return process.env.TD_CHANNEL;
39
+
40
+ const CHANNEL_TO_ENV: Record<string, string> = {
41
+ dev: "dev",
42
+ test: "staging",
43
+ canary: "production",
44
+ stable: "production",
45
+ };
46
+ const VALID_CHANNELS = new Set(Object.keys(CHANNEL_TO_ENV));
47
+ const VALID_ENVS = new Set(["dev", "staging", "production"]);
48
+
49
+ function resolveChannel(ver: string): string {
50
+ if (process.env.TD_CHANNEL && VALID_CHANNELS.has(process.env.TD_CHANNEL)) return process.env.TD_CHANNEL;
51
+ if (process.env.TD_ENV && VALID_CHANNELS.has(process.env.TD_ENV)) return process.env.TD_ENV;
42
52
  const pre = semver.prerelease(ver);
43
- if (pre && pre.length > 0 && KNOWN_CHANNELS.has(String(pre[0]))) return String(pre[0]);
44
- return "latest";
53
+ if (pre && pre.length > 0 && VALID_CHANNELS.has(String(pre[0]))) return String(pre[0]);
54
+ return "stable";
55
+ }
56
+
57
+ function resolveSentryEnvironment(ver: string): string {
58
+ if (process.env.TD_ENV && VALID_ENVS.has(process.env.TD_ENV)) return process.env.TD_ENV;
59
+ return CHANNEL_TO_ENV[resolveChannel(ver)] || "production";
45
60
  }
46
- const releaseChannel = resolveReleaseChannel(version);
61
+
62
+ const activeChannel = resolveChannel(version);
63
+ const sentryEnvironment = resolveSentryEnvironment(version);
47
64
 
48
65
  const isSentryEnabled = () => {
49
66
  if (process.env.TD_TELEMETRY === "false") {
@@ -58,7 +75,7 @@ if (isSentryEnabled()) {
58
75
  dsn:
59
76
  process.env.SENTRY_DSN ||
60
77
  "https://452bd5a00dbd83a38ee8813e11c57694@o4510262629236736.ingest.us.sentry.io/4510480443637760",
61
- environment: releaseChannel,
78
+ environment: sentryEnvironment,
62
79
  release: version,
63
80
  sampleRate: 1.0,
64
81
  tracesSampleRate: 1.0,
@@ -66,6 +83,7 @@ if (isSentryEnabled()) {
66
83
  integrations: [Sentry.httpIntegration(), Sentry.nodeContextIntegration()],
67
84
  initialScope: {
68
85
  tags: {
86
+ channel: activeChannel,
69
87
  platform: os.platform(),
70
88
  arch: os.arch(),
71
89
  nodeVersion: process.version,
@@ -99,6 +117,11 @@ if (isSentryEnabled()) {
99
117
  if (error && typeof error === "object" && "name" in error && (error as { name: string }).name === "TestFailure") {
100
118
  return null;
101
119
  }
120
+
121
+ // Filter out ElementNotFoundError - expected test outcome, not a crash
122
+ if (error && typeof error === "object" && "name" in error && (error as { name: string }).name === "ElementNotFoundError") {
123
+ return null;
124
+ }
102
125
 
103
126
  return event;
104
127
  },
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "testdriverai",
3
- "version": "7.8.0-test.7",
3
+ "version": "7.8.0-test.71",
4
4
  "description": "Next generation autonomous AI agent for end-to-end testing of web & desktop",
5
5
  "main": "sdk.js",
6
6
  "types": "sdk.d.ts",
@@ -37,8 +37,8 @@
37
37
  "start": "node bin/testdriverai.js",
38
38
  "dev": "DEV=true node bin/testdriverai.js",
39
39
  "debug": "DEV=true VERBOSE=true node bin/testdriverai.js",
40
- "docs": "npm run docs:skills && cd docs && npx mint@latest dev",
41
- "docs:dev": "cd docs && npx mint dev",
40
+ "docs": "npm run docs:skills && cd docs && npx mint@latest dev --port 3002",
41
+ "docs:dev": "cd docs && npx mint dev --port 3002",
42
42
  "docs:build": "npm run docs:skills && cd docs && npx mint@latest build",
43
43
  "docs:links": "node docs/_scripts/link-replacer.js",
44
44
  "docs:skills": "node docs/_scripts/generate-skills.js",
@@ -116,6 +116,7 @@
116
116
  },
117
117
  "overrides": {
118
118
  "glob": "^11.0.1",
119
+ "obug": "2.1.0",
119
120
  "rimraf": "^5.0.10"
120
121
  },
121
122
  "peerDependencies": {
package/sdk.d.ts CHANGED
@@ -273,6 +273,8 @@ export interface TestDriverOptions {
273
273
  sandboxAmi?: string;
274
274
  /** EC2 instance type for sandbox (e.g., 'i3.metal') */
275
275
  sandboxInstance?: string;
276
+ /** E2B template ID to use when creating the sandbox (e.g., 'my-template-id') */
277
+ e2bTemplateId?: string;
276
278
  /** Cache key for element finding operations. If provided, enables caching tied to this key */
277
279
  cacheKey?: string;
278
280
  /** Reconnect to the last used sandbox instead of creating a new one. When true, provision methods (chrome, vscode, installer, etc.) will be skipped since the application is already running. Throws error if no previous sandbox exists. */
@@ -327,6 +329,8 @@ export interface ConnectOptions {
327
329
  sandboxAmi?: string;
328
330
  /** EC2 instance type for sandbox (e.g., 'i3.metal') */
329
331
  sandboxInstance?: string;
332
+ /** E2B template ID to use when creating the sandbox (e.g., 'my-template-id') */
333
+ e2bTemplateId?: string;
330
334
  /** Operating system for the sandbox (default: 'linux') */
331
335
  os?: "windows" | "linux";
332
336
  /**
package/sdk.js CHANGED
@@ -481,7 +481,7 @@ class Element {
481
481
  let cacheKey = null;
482
482
  let cacheThreshold = null;
483
483
  let perCommandThresholds = null; // Per-command { screen, element } override
484
- let zoom = false; // Default to disabled, enable with zoom: true
484
+ let zoom = true; // Default to enabled
485
485
  let perCommandAi = null; // Per-command AI config override
486
486
 
487
487
  let minConfidence = null; // Minimum confidence threshold
@@ -494,8 +494,8 @@ class Element {
494
494
  // New: options is an object with cacheKey and/or cacheThreshold
495
495
  cacheKey = options.cacheKey || null;
496
496
  cacheThreshold = options.cacheThreshold ?? null;
497
- // zoom defaults to false unless explicitly set to true
498
- zoom = options.zoom === true;
497
+ // zoom defaults to true unless explicitly set to false
498
+ zoom = options.zoom !== false;
499
499
  // Minimum confidence threshold: fail find if AI confidence is below this value
500
500
  minConfidence = options.confidence ?? null;
501
501
  // Element type hint for prompt wrapping
@@ -568,7 +568,7 @@ class Element {
568
568
  cacheKey: cacheKey,
569
569
  os: this.sdk.os,
570
570
  resolution: this.sdk.resolution,
571
- zoom: zoom,
571
+ zoom: zoom === true ? 1 : zoom === false ? 0 : zoom,
572
572
  confidence: minConfidence,
573
573
  type: elementType,
574
574
  ai: {
@@ -623,6 +623,11 @@ class Element {
623
623
 
624
624
  // Track find interaction once at the end (fire-and-forget, don't block)
625
625
  const sessionId = this.sdk.getSessionId();
626
+ const findCacheHit = response?.cacheHit || response?.cache_hit || response?.cached || false;
627
+ // Increment local interaction counters
628
+ this.sdk._interactionStats.total++;
629
+ this.sdk._interactionStats.byType.find = (this.sdk._interactionStats.byType.find || 0) + 1;
630
+ if (findCacheHit) this.sdk._interactionStats.cached++;
626
631
  if (sessionId && this.sdk.apiClient) {
627
632
  this.sdk.apiClient
628
633
  .req("interaction/track", {
@@ -632,11 +637,7 @@ class Element {
632
637
  timestamp: absoluteTimestamp, // Absolute epoch timestamp - frontend calculates relative using clientStartDate
633
638
  success: this._found,
634
639
  error: findError,
635
- cacheHit:
636
- response?.cacheHit ||
637
- response?.cache_hit ||
638
- response?.cached ||
639
- false,
640
+ cacheHit: findCacheHit,
640
641
  selector: response?.selector,
641
642
  selectorUsed: !!response?.selector,
642
643
  confidence: response?.confidence ?? null,
@@ -1498,6 +1499,7 @@ class TestDriverSDK {
1498
1499
  // Store sandbox configuration options
1499
1500
  this.sandboxAmi = options.sandboxAmi || null;
1500
1501
  this.sandboxInstance = options.sandboxInstance || null;
1502
+ this.e2bTemplateId = options.e2bTemplateId || null;
1501
1503
 
1502
1504
  // Store reconnect preference from options
1503
1505
  this.reconnect =
@@ -1616,6 +1618,12 @@ class TestDriverSDK {
1616
1618
  // Uploaded to S3 at cleanup so they can be displayed alongside dashcam replays.
1617
1619
  this._logBuffer = [];
1618
1620
 
1621
+ // API version discovered by _logEnvironmentInfo()
1622
+ this._apiVersion = null;
1623
+
1624
+ // Local interaction counters — incremented at each interaction/track call site
1625
+ this._interactionStats = { total: 0, cached: 0, byType: {} };
1626
+
1619
1627
  // Set up event listeners once (they live for the lifetime of the SDK instance)
1620
1628
  this._setupLogging();
1621
1629
 
@@ -2716,6 +2724,7 @@ CAPTCHA_SOLVER_EOF`,
2716
2724
  * @param {string} options.ip - Direct IP address to connect to
2717
2725
  * @param {string} options.sandboxAmi - AMI to use for the sandbox
2718
2726
  * @param {string} options.sandboxInstance - Instance type for the sandbox
2727
+ * @param {string} options.e2bTemplateId - E2B template ID to use when creating the sandbox
2719
2728
  * @param {string} options.os - Operating system for the sandbox (windows or linux)
2720
2729
  * @param {boolean} options.reuseConnection - Reuse recent connection if available (default: true)
2721
2730
  * @returns {Promise<Object>} Sandbox instance details
@@ -2749,6 +2758,9 @@ CAPTCHA_SOLVER_EOF`,
2749
2758
  }
2750
2759
  }
2751
2760
 
2761
+ // Log environment info immediately so it's visible even if auth fails
2762
+ this._logEnvironmentInfo();
2763
+
2752
2764
  // Authenticate first if not already authenticated
2753
2765
  if (!this.authenticated) {
2754
2766
  await this.auth();
@@ -2801,6 +2813,12 @@ CAPTCHA_SOLVER_EOF`,
2801
2813
  } else if (this.sandboxInstance) {
2802
2814
  this.agent.sandboxInstance = this.sandboxInstance;
2803
2815
  }
2816
+ // Use e2bTemplateId from connectOptions if provided, otherwise fall back to constructor value
2817
+ if (connectOptions.e2bTemplateId !== undefined) {
2818
+ this.agent.e2bTemplateId = connectOptions.e2bTemplateId;
2819
+ } else if (this.e2bTemplateId) {
2820
+ this.agent.e2bTemplateId = this.e2bTemplateId;
2821
+ }
2804
2822
  // Use os from connectOptions if provided, otherwise fall back to this.os
2805
2823
  if (connectOptions.os !== undefined) {
2806
2824
  this.agent.sandboxOs = connectOptions.os;
@@ -2865,9 +2883,6 @@ CAPTCHA_SOLVER_EOF`,
2865
2883
  sandboxId: this.instance?.instanceId,
2866
2884
  });
2867
2885
 
2868
- // Log environment info (non-blocking, skip on stable)
2869
- this._logEnvironmentInfo();
2870
-
2871
2886
  return this.instance;
2872
2887
  }
2873
2888
 
@@ -3193,6 +3208,11 @@ CAPTCHA_SOLVER_EOF`,
3193
3208
 
3194
3209
  // Track successful findAll interaction (fire-and-forget, don't block)
3195
3210
  const sessionId = this.getSessionId();
3211
+ const findAllCacheHit = response.cached || false;
3212
+ // Increment local interaction counters
3213
+ this._interactionStats.total++;
3214
+ this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
3215
+ if (findAllCacheHit) this._interactionStats.cached++;
3196
3216
  if (sessionId && this.apiClient) {
3197
3217
  this.apiClient
3198
3218
  .req("interaction/track", {
@@ -3202,7 +3222,7 @@ CAPTCHA_SOLVER_EOF`,
3202
3222
  timestamp: absoluteTimestamp, // Absolute epoch timestamp - frontend calculates relative using clientStartDate
3203
3223
  success: true,
3204
3224
  input: { count: elements.length },
3205
- cacheHit: response.cached || false,
3225
+ cacheHit: findAllCacheHit,
3206
3226
  selector: response.selector,
3207
3227
  selectorUsed: !!response.selector,
3208
3228
  screenshotUrl: response.screenshotKey ?? null,
@@ -3248,6 +3268,11 @@ CAPTCHA_SOLVER_EOF`,
3248
3268
 
3249
3269
  // No elements found - track interaction (fire-and-forget, don't block)
3250
3270
  const sessionId = this.getSessionId();
3271
+ const noResultCacheHit = response?.cached || false;
3272
+ // Increment local interaction counters
3273
+ this._interactionStats.total++;
3274
+ this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
3275
+ if (noResultCacheHit) this._interactionStats.cached++;
3251
3276
  if (sessionId && this.apiClient) {
3252
3277
  this.apiClient
3253
3278
  .req("interaction/track", {
@@ -3258,7 +3283,7 @@ CAPTCHA_SOLVER_EOF`,
3258
3283
  success: false,
3259
3284
  error: "No elements found",
3260
3285
  input: { count: 0 },
3261
- cacheHit: response?.cached || false,
3286
+ cacheHit: noResultCacheHit,
3262
3287
  selector: response?.selector,
3263
3288
  selectorUsed: !!response?.selector,
3264
3289
  screenshotUrl: response?.screenshotKey ?? null,
@@ -3292,6 +3317,9 @@ CAPTCHA_SOLVER_EOF`,
3292
3317
 
3293
3318
  // Track findAll error interaction (fire-and-forget, don't block)
3294
3319
  const sessionId = this.getSessionId();
3320
+ // Increment local interaction counters
3321
+ this._interactionStats.total++;
3322
+ this._interactionStats.byType.findAll = (this._interactionStats.byType.findAll || 0) + 1;
3295
3323
  if (sessionId && this.apiClient) {
3296
3324
  this.apiClient
3297
3325
  .req("interaction/track", {
@@ -3817,7 +3845,7 @@ CAPTCHA_SOLVER_EOF`,
3817
3845
  const apiRoot = this.config?.TD_API_ROOT || 'unknown';
3818
3846
  const apiKey = this.config?.TD_API_KEY || '';
3819
3847
  const maskedKey = apiKey.length > 4 ? '***' + apiKey.slice(-4) : '(not set)';
3820
- const env = process.env.TD_ENV || 'unknown';
3848
+ const env = process.env.TD_CHANNEL || process.env.TD_ENV || 'unknown';
3821
3849
  const os = this.agent?.options?.os || process.env.TD_OS || 'linux';
3822
3850
  const sdkVersion = require('./package.json').version;
3823
3851
 
@@ -3843,6 +3871,8 @@ CAPTCHA_SOLVER_EOF`,
3843
3871
  res.on('end', () => {
3844
3872
  try {
3845
3873
  const info = JSON.parse(data);
3874
+ // Persist API version for test result metadata
3875
+ this._apiVersion = info.version || null;
3846
3876
  const commit = info.commit || 'unknown';
3847
3877
  const shortCommit = commit.substring(0, 7);
3848
3878
  const commitUrl = commit !== 'unknown'
@@ -0,0 +1,79 @@
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+
4
+ # Usage: ./install-dev-runner.sh <instance-id>
5
+ INSTANCE_ID="${1:?Usage: $0 <instance-id>}"
6
+ AWS_REGION="${AWS_REGION:-us-east-2}"
7
+
8
+ RUNNER_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/../../../runner" && pwd)"
9
+
10
+ echo "Packing local runner..."
11
+ TMPDIR=$(mktemp -d)
12
+ pushd "$RUNNER_DIR" > /dev/null
13
+ npm pack --pack-destination "$TMPDIR" > /dev/null 2>&1
14
+ TARBALL=$(ls "$TMPDIR"/*.tgz)
15
+ popd > /dev/null
16
+ echo "Tarball: $TARBALL"
17
+
18
+ echo "Uploading to S3..."
19
+ S3_KEY="runner-dev/$(date +%s)-$(openssl rand -hex 4)/runner.tgz"
20
+ aws s3 cp "$TARBALL" "s3://v7-transfer/${S3_KEY}" --region "$AWS_REGION" > /dev/null
21
+ DOWNLOAD_URL=$(aws s3 presign "s3://v7-transfer/${S3_KEY}" --expires-in 900 --region "$AWS_REGION")
22
+ rm -rf "$TMPDIR"
23
+
24
+ echo "Creating SSM params file..."
25
+
26
+ # Write Python script to temp file to generate valid JSON
27
+ PYTHON_SCRIPT=$(mktemp --suffix=.py)
28
+ cat > "$PYTHON_SCRIPT" << 'PYEOF'
29
+ import json
30
+ import sys
31
+
32
+ url = sys.argv[1]
33
+
34
+ commands = [
35
+ "Write-Host '=== Stopping runner ==='",
36
+ "Stop-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
37
+ "Stop-Process -Name node -Force -ErrorAction SilentlyContinue",
38
+ "Start-Sleep -Seconds 2",
39
+ "Set-Location 'C:\\testdriver\\sandbox-agent'",
40
+ "$tarball = 'C:\\Windows\\Temp\\runner-dev.tgz'",
41
+ f"Invoke-WebRequest -Uri '{url}' -OutFile $tarball",
42
+ "Write-Host 'Tarball size:'; (Get-Item $tarball).Length",
43
+ "Remove-Item -Path lib -Recurse -Force -ErrorAction SilentlyContinue",
44
+ "tar -xzf $tarball --strip-components=1 -C .",
45
+ "Get-Content 'package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
46
+ "Write-Host '=== Starting runner ==='",
47
+ "Start-ScheduledTask -TaskName RunTestDriverAgent",
48
+ "Start-Sleep -Seconds 3",
49
+ "Get-Content 'C:\\testdriver\\log.txt' -Tail 20"
50
+ ]
51
+
52
+ params = {"commands": commands}
53
+ print(json.dumps(params))
54
+ PYEOF
55
+
56
+ python3 "$PYTHON_SCRIPT" "$DOWNLOAD_URL" > /tmp/ssm-install-params.json
57
+ rm "$PYTHON_SCRIPT"
58
+
59
+ echo "Sending SSM command..."
60
+ CMD_JSON=$(aws ssm send-command \
61
+ --region "$AWS_REGION" \
62
+ --instance-ids "$INSTANCE_ID" \
63
+ --document-name "AWS-RunPowerShellScript" \
64
+ --parameters "file:///tmp/ssm-install-params.json" \
65
+ --output json)
66
+
67
+ COMMAND_ID=$(echo "$CMD_JSON" | jq -r '.Command.CommandId')
68
+ echo "Command ID: $COMMAND_ID"
69
+
70
+ echo "Waiting for completion..."
71
+ aws ssm wait command-executed --region "$AWS_REGION" --command-id "$COMMAND_ID" --instance-id "$INSTANCE_ID" || true
72
+
73
+ echo "Getting output..."
74
+ aws ssm get-command-invocation \
75
+ --region "$AWS_REGION" \
76
+ --command-id "$COMMAND_ID" \
77
+ --instance-id "$INSTANCE_ID" \
78
+ --query 'StandardOutputContent' \
79
+ --output text
@@ -141,6 +141,171 @@ while :; do
141
141
  sleep 20
142
142
  done
143
143
 
144
+ # --- 4) Install/update runner ---
145
+ echo "Installing runner..."
146
+
147
+ # Determine environment and version
148
+ TD_CHANNEL="${TD_CHANNEL:-stable}"
149
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
150
+ SDK_PKG_JSON="${SCRIPT_DIR}/../../../sdk/package.json"
151
+ RUNNER_DIR="${SCRIPT_DIR}/../../../runner"
152
+
153
+ if [ -f "$SDK_PKG_JSON" ]; then
154
+ RUNNER_VERSION=$(jq -r '.version' "$SDK_PKG_JSON")
155
+ echo "Runner version from SDK: $RUNNER_VERSION"
156
+ else
157
+ RUNNER_VERSION="$TD_CHANNEL"
158
+ echo "SDK package.json not found, using env tag: $RUNNER_VERSION"
159
+ fi
160
+
161
+ if [ "$TD_CHANNEL" = "dev" ]; then
162
+ echo "Dev mode: packing and uploading local runner to S3..."
163
+
164
+ # Pack local runner
165
+ TMPDIR=$(mktemp -d)
166
+ pushd "$RUNNER_DIR" > /dev/null
167
+ npm pack --pack-destination "$TMPDIR" > /dev/null 2>&1
168
+ TARBALL=$(ls "$TMPDIR"/*.tgz | head -1)
169
+ popd > /dev/null
170
+
171
+ # Upload to S3
172
+ S3_BUCKET="${AWS_BUCKET_IMAGE_TRANSFER:-v7-transfer}"
173
+ S3_KEY="runner-dev/$(date +%s)-$(openssl rand -hex 4)/runner.tgz"
174
+ aws s3 cp "$TARBALL" "s3://${S3_BUCKET}/${S3_KEY}" --region "$AWS_REGION"
175
+
176
+ # Generate presigned URL (15 min)
177
+ DOWNLOAD_URL=$(aws s3 presign "s3://${S3_BUCKET}/${S3_KEY}" --expires-in 900 --region "$AWS_REGION")
178
+ rm -rf "$TMPDIR"
179
+
180
+ # Build SSM parameters JSON in a temp file to avoid shell escaping issues with URL
181
+ PARAMS_FILE=$(mktemp)
182
+ cat > "$PARAMS_FILE" << 'PARAMS_EOF'
183
+ {
184
+ "commands": [
185
+ "Write-Host '=== Starting runner dev install ==='",
186
+ "Write-Host 'Stopping existing runner processes...'",
187
+ "Stop-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
188
+ "Stop-Process -Name node -Force -ErrorAction SilentlyContinue",
189
+ "Start-Sleep -Seconds 2",
190
+ "Write-Host 'Current runner version:'",
191
+ "Get-Content 'C:\\testdriver\\sandbox-agent\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
192
+ "Set-Location 'C:\\testdriver\\sandbox-agent'",
193
+ "Write-Host 'Dev mode: downloading runner from S3...'",
194
+ "$tarball = 'C:\\Windows\\Temp\\runner-dev.tgz'",
195
+ PARAMS_EOF
196
+
197
+ # Add the URL line with proper JSON escaping
198
+ echo " \"Invoke-WebRequest -Uri '$(echo "$DOWNLOAD_URL" | sed 's/"/\\"/g')' -OutFile \$tarball\"," >> "$PARAMS_FILE"
199
+
200
+ cat >> "$PARAMS_FILE" << 'PARAMS_EOF'
201
+ "Write-Host 'Downloaded tarball size:'",
202
+ "(Get-Item $tarball).Length",
203
+ "Write-Host 'Extracting runner...'",
204
+ "tar -xzf $tarball -C 'C:\\Windows\\Temp'",
205
+ "Write-Host 'Extracted package contents:'",
206
+ "Get-ChildItem 'C:\\Windows\\Temp\\package' -Recurse | Select-Object FullName",
207
+ "Write-Host 'New runner version in package:'",
208
+ "Get-Content 'C:\\Windows\\Temp\\package\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
209
+ "Write-Host 'Clearing old lib folder...'",
210
+ "Remove-Item 'C:\\testdriver\\sandbox-agent\\lib' -Recurse -Force -ErrorAction SilentlyContinue",
211
+ "Write-Host 'Copying files to sandbox-agent...'",
212
+ "xcopy 'C:\\Windows\\Temp\\package\\*' 'C:\\testdriver\\sandbox-agent\\' /E /Y /I",
213
+ "Write-Host 'Files after copy:'",
214
+ "Get-ChildItem 'C:\\testdriver\\sandbox-agent' | Select-Object Name",
215
+ "Remove-Item 'C:\\Windows\\Temp\\package' -Recurse -Force -ErrorAction SilentlyContinue",
216
+ "Remove-Item $tarball -Force -ErrorAction SilentlyContinue",
217
+ "Write-Host 'Runner version after copy:'",
218
+ "Get-Content 'C:\\testdriver\\sandbox-agent\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
219
+ "Write-Host 'Installing npm dependencies...'",
220
+ "npm install --omit=dev 2>&1 | Write-Host",
221
+ "Write-Host 'Final verification - ably-service.js exists:'",
222
+ "Test-Path 'C:\\testdriver\\sandbox-agent\\lib\\ably-service.js'",
223
+ "Write-Host 'Restarting RunTestDriverAgent scheduled task...'",
224
+ "Start-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
225
+ "Write-Host '=== Runner install complete (dev) ==='"
226
+ ]
227
+ }
228
+ PARAMS_EOF
229
+
230
+ echo "Sending SSM command to download and install runner from S3..."
231
+ INSTALL_CMD=$(aws ssm send-command \
232
+ --region "$AWS_REGION" \
233
+ --instance-ids "$INSTANCE_ID" \
234
+ --document-name "AWS-RunPowerShellScript" \
235
+ --parameters "file://$PARAMS_FILE" \
236
+ --timeout-seconds 180 \
237
+ --output json)
238
+ rm -f "$PARAMS_FILE"
239
+ else
240
+ echo "Installing @testdriverai/runner@${RUNNER_VERSION} via npm pack + extract..."
241
+
242
+ # Build SSM parameters JSON in a temp file (same approach as dev mode)
243
+ PARAMS_FILE=$(mktemp)
244
+ cat > "$PARAMS_FILE" << PARAMS_EOF
245
+ {
246
+ "commands": [
247
+ "Write-Host '=== Starting runner install (npm pack) ==='",
248
+ "Write-Host 'Stopping existing runner processes...'",
249
+ "Stop-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
250
+ "Stop-Process -Name node -Force -ErrorAction SilentlyContinue",
251
+ "Start-Sleep -Seconds 2",
252
+ "Write-Host 'Current runner version:'",
253
+ "Get-Content 'C:\\\\testdriver\\\\sandbox-agent\\\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
254
+ "Set-Location 'C:\\\\Windows\\\\Temp'",
255
+ "Write-Host 'Downloading @testdriverai/runner@${RUNNER_VERSION} via npm pack...'",
256
+ "npm pack @testdriverai/runner@${RUNNER_VERSION} 2>&1 | Write-Host",
257
+ "\$tarball = (Get-ChildItem 'C:\\\\Windows\\\\Temp\\\\testdriverai-runner-*.tgz' | Sort-Object LastWriteTime -Descending | Select-Object -First 1).FullName",
258
+ "Write-Host \"Downloaded tarball: \$tarball\"",
259
+ "Write-Host 'Extracting runner...'",
260
+ "tar -xzf \$tarball -C 'C:\\\\Windows\\\\Temp'",
261
+ "Write-Host 'New runner version in package:'",
262
+ "Get-Content 'C:\\\\Windows\\\\Temp\\\\package\\\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
263
+ "Write-Host 'Clearing old lib folder...'",
264
+ "Remove-Item 'C:\\\\testdriver\\\\sandbox-agent\\\\lib' -Recurse -Force -ErrorAction SilentlyContinue",
265
+ "Write-Host 'Copying files to sandbox-agent...'",
266
+ "xcopy 'C:\\\\Windows\\\\Temp\\\\package\\\\*' 'C:\\\\testdriver\\\\sandbox-agent\\\\' /E /Y /I",
267
+ "Write-Host 'Runner version after copy:'",
268
+ "Get-Content 'C:\\\\testdriver\\\\sandbox-agent\\\\package.json' | ConvertFrom-Json | Select-Object -ExpandProperty version",
269
+ "Remove-Item 'C:\\\\Windows\\\\Temp\\\\package' -Recurse -Force -ErrorAction SilentlyContinue",
270
+ "Remove-Item \$tarball -Force -ErrorAction SilentlyContinue",
271
+ "Set-Location 'C:\\\\testdriver\\\\sandbox-agent'",
272
+ "Write-Host 'Installing npm dependencies...'",
273
+ "npm install --omit=dev 2>&1 | Write-Host",
274
+ "Write-Host 'Restarting RunTestDriverAgent scheduled task...'",
275
+ "Start-ScheduledTask -TaskName RunTestDriverAgent -ErrorAction SilentlyContinue",
276
+ "Write-Host '=== Runner install complete (npm pack) ==='"
277
+ ]
278
+ }
279
+ PARAMS_EOF
280
+
281
+ INSTALL_CMD=$(aws ssm send-command \
282
+ --region "$AWS_REGION" \
283
+ --instance-ids "$INSTANCE_ID" \
284
+ --document-name "AWS-RunPowerShellScript" \
285
+ --parameters "file://$PARAMS_FILE" \
286
+ --timeout-seconds 180 \
287
+ --output json)
288
+ rm -f "$PARAMS_FILE"
289
+ fi
290
+
291
+ INSTALL_CMD_ID=$(jq -r '.Command.CommandId' <<<"$INSTALL_CMD")
292
+ echo "Runner install command sent (Command ID: $INSTALL_CMD_ID)"
293
+
294
+ # Wait for install to complete
295
+ echo "Waiting for runner install to complete..."
296
+ if aws ssm wait command-executed --region "$AWS_REGION" --command-id "$INSTALL_CMD_ID" --instance-id "$INSTANCE_ID" 2>/dev/null; then
297
+ echo "✓ Runner install succeeded"
298
+ else
299
+ INSTALL_STATUS=$(aws ssm get-command-invocation \
300
+ --region "$AWS_REGION" \
301
+ --command-id "$INSTALL_CMD_ID" \
302
+ --instance-id "$INSTANCE_ID" \
303
+ --output json 2>/dev/null || echo '{}')
304
+ echo "⚠ Runner install status: $(jq -r '.Status // "Unknown"' <<<"$INSTALL_STATUS")"
305
+ echo "Output: $(jq -r '.StandardOutputContent // "No output"' <<<"$INSTALL_STATUS" | head -20)"
306
+ echo "Errors: $(jq -r '.StandardErrorContent // "No errors"' <<<"$INSTALL_STATUS" | head -10)"
307
+ fi
308
+
144
309
  echo "Getting Public IP..."
145
310
 
146
311
  # --- 5) Get instance Public IP ---