agent-browser-stealth 0.14.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (77) hide show
  1. package/LICENSE +201 -0
  2. package/README.md +1219 -0
  3. package/bin/agent-browser-darwin-arm64 +0 -0
  4. package/bin/agent-browser-local +0 -0
  5. package/bin/agent-browser.js +109 -0
  6. package/dist/actions.d.ts +17 -0
  7. package/dist/actions.d.ts.map +1 -0
  8. package/dist/actions.js +1917 -0
  9. package/dist/actions.js.map +1 -0
  10. package/dist/browser.d.ts +598 -0
  11. package/dist/browser.d.ts.map +1 -0
  12. package/dist/browser.js +2287 -0
  13. package/dist/browser.js.map +1 -0
  14. package/dist/daemon.d.ts +66 -0
  15. package/dist/daemon.d.ts.map +1 -0
  16. package/dist/daemon.js +603 -0
  17. package/dist/daemon.js.map +1 -0
  18. package/dist/diff.d.ts +18 -0
  19. package/dist/diff.d.ts.map +1 -0
  20. package/dist/diff.js +271 -0
  21. package/dist/diff.js.map +1 -0
  22. package/dist/encryption.d.ts +50 -0
  23. package/dist/encryption.d.ts.map +1 -0
  24. package/dist/encryption.js +85 -0
  25. package/dist/encryption.js.map +1 -0
  26. package/dist/ios-actions.d.ts +11 -0
  27. package/dist/ios-actions.d.ts.map +1 -0
  28. package/dist/ios-actions.js +228 -0
  29. package/dist/ios-actions.js.map +1 -0
  30. package/dist/ios-manager.d.ts +266 -0
  31. package/dist/ios-manager.d.ts.map +1 -0
  32. package/dist/ios-manager.js +1073 -0
  33. package/dist/ios-manager.js.map +1 -0
  34. package/dist/protocol.d.ts +26 -0
  35. package/dist/protocol.d.ts.map +1 -0
  36. package/dist/protocol.js +935 -0
  37. package/dist/protocol.js.map +1 -0
  38. package/dist/snapshot.d.ts +67 -0
  39. package/dist/snapshot.d.ts.map +1 -0
  40. package/dist/snapshot.js +514 -0
  41. package/dist/snapshot.js.map +1 -0
  42. package/dist/state-utils.d.ts +77 -0
  43. package/dist/state-utils.d.ts.map +1 -0
  44. package/dist/state-utils.js +178 -0
  45. package/dist/state-utils.js.map +1 -0
  46. package/dist/stealth.d.ts +22 -0
  47. package/dist/stealth.d.ts.map +1 -0
  48. package/dist/stealth.js +614 -0
  49. package/dist/stealth.js.map +1 -0
  50. package/dist/stream-server.d.ts +117 -0
  51. package/dist/stream-server.d.ts.map +1 -0
  52. package/dist/stream-server.js +309 -0
  53. package/dist/stream-server.js.map +1 -0
  54. package/dist/types.d.ts +855 -0
  55. package/dist/types.d.ts.map +1 -0
  56. package/dist/types.js +2 -0
  57. package/dist/types.js.map +1 -0
  58. package/package.json +85 -0
  59. package/scripts/build-all-platforms.sh +68 -0
  60. package/scripts/check-creepjs-headless.js +137 -0
  61. package/scripts/check-sannysoft-webdriver.js +112 -0
  62. package/scripts/check-version-sync.js +39 -0
  63. package/scripts/copy-native.js +36 -0
  64. package/scripts/postinstall.js +275 -0
  65. package/scripts/sync-upstream.sh +142 -0
  66. package/scripts/sync-version.js +69 -0
  67. package/skills/agent-browser/SKILL.md +464 -0
  68. package/skills/agent-browser/references/authentication.md +202 -0
  69. package/skills/agent-browser/references/commands.md +263 -0
  70. package/skills/agent-browser/references/profiling.md +120 -0
  71. package/skills/agent-browser/references/proxy-support.md +194 -0
  72. package/skills/agent-browser/references/session-management.md +193 -0
  73. package/skills/agent-browser/references/snapshot-refs.md +194 -0
  74. package/skills/agent-browser/references/video-recording.md +173 -0
  75. package/skills/agent-browser/templates/authenticated-session.sh +100 -0
  76. package/skills/agent-browser/templates/capture-workflow.sh +69 -0
  77. package/skills/agent-browser/templates/form-automation.sh +62 -0
@@ -0,0 +1,1917 @@
1
+ import * as fs from 'fs';
2
+ import * as path from 'path';
3
+ import { mkdirSync } from 'node:fs';
4
+ import { getAppDir } from './daemon.js';
5
+ import { getSessionsDir, readStateFile, isValidSessionName, isEncryptedPayload, listStateFiles, cleanupExpiredStates, } from './state-utils.js';
6
+ import { successResponse, errorResponse } from './protocol.js';
7
+ import { diffSnapshots, diffScreenshots } from './diff.js';
8
+ import { getEnhancedSnapshot } from './snapshot.js';
9
// Receiver for screencast frames. Stays null until the daemon registers one
// through setScreencastFrameCallback (i.e. while streaming is inactive).
let screencastFrameCallback = null;
/**
 * Register the receiver for screencast frames.
 *
 * Called by the daemon to set up frame streaming. The value is stored as
 * given; no validation is performed here.
 *
 * @param {Function|null} callback - Receiver to remember for screencast frames.
 */
export function setScreencastFrameCallback(callback) {
    screencastFrameCallback = callback;
}
18
/**
 * Convert Playwright errors to AI-friendly messages.
 *
 * The error text is matched against a fixed list of substrings, checked in
 * order; the first match wins. Recognised failures come back as a new Error
 * whose message names the selector and suggests a next step, and whose
 * `cause` is the value that was passed in, so the raw failure stays
 * inspectable. Unrecognised failures are returned unchanged (non-Error values
 * are wrapped in an Error carrying their string form).
 *
 * @param {unknown} error - The value that was thrown.
 * @param {string} selector - Selector or ref the failed action targeted; only
 *   interpolated into the message.
 * @returns {Error} The friendly error, or the original error when no pattern matches.
 * @internal Exported for testing
 */
export function toAIFriendlyError(error, selector) {
    const message = error instanceof Error ? error.message : String(error);
    // Every rewritten error keeps the original attached as `cause`.
    const friendly = (text) => new Error(text, { cause: error });
    // Strict mode violation: the selector resolved to more than one element.
    if (message.includes('strict mode violation')) {
        // Report the exact count when the message carries one.
        const countMatch = message.match(/resolved to (\d+) elements/);
        const count = countMatch ? countMatch[1] : 'multiple';
        return friendly(`Selector "${selector}" matched ${count} elements. ` +
            `Run 'snapshot' to get updated refs, or use a more specific CSS selector.`);
    }
    // Element covered by an overlay/modal. Must be checked BEFORE the timeout
    // case so that a blocked element is not reported as a plain timeout.
    if (message.includes('intercepts pointer events')) {
        return friendly(`Element "${selector}" is blocked by another element (likely a modal or overlay). ` +
            `Try dismissing any modals/cookie banners first.`);
    }
    // Element present but not visible (and the failure is not a timeout).
    if (message.includes('not visible') && !message.includes('Timeout')) {
        return friendly(`Element "${selector}" is not visible. ` +
            `Try scrolling it into view or check if it's hidden.`);
    }
    // General timeout: the action could not complete in time.
    // NOTE(review): a message containing both "Timeout ... exceeded" and
    // "waiting for" is caught here, before the not-found branch below.
    if (message.includes('Timeout') && message.includes('exceeded')) {
        return friendly(`Action on "${selector}" timed out. The element may be blocked, still loading, or not interactable. ` +
            `Run 'snapshot' to check the current page state.`);
    }
    // Element not found (still waiting for it to appear).
    if (message.includes('waiting for') &&
        (message.includes('to be visible') || message.includes('Timeout'))) {
        return friendly(`Element "${selector}" not found or not visible. ` +
            `Run 'snapshot' to see current page elements.`);
    }
    // Unknown case: hand back the original error.
    return error instanceof Error ? error : new Error(message);
}
57
// Action name -> handler lookup used by executeCommand. Built on first use
// rather than at module load, so it does not depend on declaration order.
let commandHandlerTable = null;
/**
 * Return the action -> handler lookup, building it on the first call.
 *
 * Every handler is invoked as handler(command, browser). The state_* entries
 * that operate on saved state only are wrapped so they receive just the
 * command.
 */
function getCommandHandlerTable() {
    if (commandHandlerTable !== null) {
        return commandHandlerTable;
    }
    commandHandlerTable = new Map([
        ['launch', handleLaunch],
        ['navigate', handleNavigate],
        ['click', handleClick],
        ['type', handleType],
        ['fill', handleFill],
        ['check', handleCheck],
        ['uncheck', handleUncheck],
        ['upload', handleUpload],
        ['dblclick', handleDoubleClick],
        ['focus', handleFocus],
        ['drag', handleDrag],
        ['frame', handleFrame],
        ['mainframe', handleMainFrame],
        ['getbyrole', handleGetByRole],
        ['getbytext', handleGetByText],
        ['getbylabel', handleGetByLabel],
        ['getbyplaceholder', handleGetByPlaceholder],
        ['press', handlePress],
        ['screenshot', handleScreenshot],
        ['snapshot', handleSnapshot],
        ['evaluate', handleEvaluate],
        ['wait', handleWait],
        ['scroll', handleScroll],
        ['select', handleSelect],
        ['hover', handleHover],
        ['content', handleContent],
        ['close', handleClose],
        ['tab_new', handleTabNew],
        ['tab_list', handleTabList],
        ['tab_switch', handleTabSwitch],
        ['tab_close', handleTabClose],
        ['window_new', handleWindowNew],
        ['cookies_get', handleCookiesGet],
        ['cookies_set', handleCookiesSet],
        ['cookies_clear', handleCookiesClear],
        ['storage_get', handleStorageGet],
        ['storage_set', handleStorageSet],
        ['storage_clear', handleStorageClear],
        ['dialog', handleDialog],
        ['pdf', handlePdf],
        ['route', handleRoute],
        ['unroute', handleUnroute],
        ['requests', handleRequests],
        ['download', handleDownload],
        ['geolocation', handleGeolocation],
        ['permissions', handlePermissions],
        ['viewport', handleViewport],
        ['useragent', handleUserAgent],
        ['device', handleDevice],
        ['back', handleBack],
        ['forward', handleForward],
        ['reload', handleReload],
        ['url', handleUrl],
        ['title', handleTitle],
        ['getattribute', handleGetAttribute],
        ['gettext', handleGetText],
        ['isvisible', handleIsVisible],
        ['isenabled', handleIsEnabled],
        ['ischecked', handleIsChecked],
        ['count', handleCount],
        ['boundingbox', handleBoundingBox],
        ['styles', handleStyles],
        ['video_start', handleVideoStart],
        ['video_stop', handleVideoStop],
        ['trace_start', handleTraceStart],
        ['trace_stop', handleTraceStop],
        ['profiler_start', handleProfilerStart],
        ['profiler_stop', handleProfilerStop],
        ['har_start', handleHarStart],
        ['har_stop', handleHarStop],
        ['state_save', handleStateSave],
        ['state_load', handleStateLoad],
        ['state_list', (command) => handleStateList(command)],
        ['state_clear', (command) => handleStateClear(command)],
        ['state_show', (command) => handleStateShow(command)],
        ['state_clean', (command) => handleStateClean(command)],
        ['state_rename', (command) => handleStateRename(command)],
        ['console', handleConsole],
        ['errors', handleErrors],
        ['keyboard', handleKeyboard],
        ['wheel', handleWheel],
        ['tap', handleTap],
        ['clipboard', handleClipboard],
        ['highlight', handleHighlight],
        ['clear', handleClear],
        ['selectall', handleSelectAll],
        ['innertext', handleInnerText],
        ['innerhtml', handleInnerHtml],
        ['inputvalue', handleInputValue],
        ['setvalue', handleSetValue],
        ['dispatch', handleDispatch],
        ['evalhandle', handleEvalHandle],
        ['expose', handleExpose],
        ['addscript', handleAddScript],
        ['addstyle', handleAddStyle],
        ['emulatemedia', handleEmulateMedia],
        ['offline', handleOffline],
        ['headers', handleHeaders],
        ['pause', handlePause],
        ['getbyalttext', handleGetByAltText],
        ['getbytitle', handleGetByTitle],
        ['getbytestid', handleGetByTestId],
        ['nth', handleNth],
        ['waitforurl', handleWaitForUrl],
        ['waitforloadstate', handleWaitForLoadState],
        ['setcontent', handleSetContent],
        ['timezone', handleTimezone],
        ['locale', handleLocale],
        ['credentials', handleCredentials],
        ['mousemove', handleMouseMove],
        ['mousedown', handleMouseDown],
        ['mouseup', handleMouseUp],
        ['bringtofront', handleBringToFront],
        ['waitforfunction', handleWaitForFunction],
        ['scrollintoview', handleScrollIntoView],
        ['addinitscript', handleAddInitScript],
        ['keydown', handleKeyDown],
        ['keyup', handleKeyUp],
        ['inserttext', handleInsertText],
        ['multiselect', handleMultiSelect],
        ['waitfordownload', handleWaitForDownload],
        ['responsebody', handleResponseBody],
        ['screencast_start', handleScreencastStart],
        ['screencast_stop', handleScreencastStop],
        ['input_mouse', handleInputMouse],
        ['input_keyboard', handleInputKeyboard],
        ['input_touch', handleInputTouch],
        ['recording_start', handleRecordingStart],
        ['recording_stop', handleRecordingStop],
        ['recording_restart', handleRecordingRestart],
        ['diff_snapshot', handleDiffSnapshot],
        ['diff_screenshot', handleDiffScreenshot],
        ['diff_url', handleDiffUrl],
    ]);
    return commandHandlerTable;
}
/**
 * Execute a command and return a response.
 *
 * Dispatches on `command.action` to the matching handler. An unrecognised
 * action yields an error response naming that action. Anything a handler
 * throws is caught here and converted into an error response carrying the
 * error's message, so this function resolves with a response in both cases.
 *
 * @param {object} command - Parsed command; `action` selects the handler and
 *   `id` is echoed into the response.
 * @param {object} browser - Browser manager passed through to the handler.
 * @returns {Promise<object>} The handler's response, or an error response.
 */
export async function executeCommand(command, browser) {
    try {
        const handler = getCommandHandlerTable().get(command.action);
        if (handler === undefined) {
            // Not expected for well-typed commands, but handled for safety.
            return errorResponse(command.id, `Unknown action: ${command.action}`);
        }
        return await handler(command, browser);
    }
    catch (error) {
        const message = error instanceof Error ? error.message : String(error);
        return errorResponse(command.id, message);
    }
}
341
/**
 * Launch the browser using the command itself as the launch options.
 *
 * The response reports `launched: true` together with the stealth status the
 * browser manager returns for the requested engine ('chromium' when
 * `command.browser` is not set).
 */
async function handleLaunch(command, browser) {
    await browser.launch(command);
    const engine = command.browser ?? 'chromium';
    const stealth = browser.getStealthStatus(engine);
    return successResponse(command.id, { launched: true, stealth });
}
348
/**
 * Navigate the current page to `command.url`.
 *
 * When the command carries a non-empty `headers` object, those headers are
 * first registered as scoped headers for the URL. Navigation waits for
 * `command.waitUntil`, defaulting to 'load'. The response contains the page's
 * URL and title after navigation.
 */
async function handleNavigate(command, browser) {
    const page = browser.getPage();
    const { url, headers } = command;
    const hasHeaders = Boolean(headers) && Object.keys(headers).length > 0;
    if (hasHeaders) {
        await browser.setScopedHeaders(url, headers);
    }
    const waitUntil = command.waitUntil ?? 'load';
    await page.goto(url, { waitUntil });
    const landedUrl = page.url();
    const title = await page.title();
    return successResponse(command.id, { url: landedUrl, title });
}
362
/**
 * Evaluate one coordinate of a cubic Bezier curve.
 *
 * @param {number} t - Curve parameter; 0 yields p0 and 1 yields p3.
 * @param {number} p0 - Start value.
 * @param {number} p1 - First control value.
 * @param {number} p2 - Second control value.
 * @param {number} p3 - End value.
 * @returns {number} The curve value at t.
 */
function bezierPoint(t, p0, p1, p2, p3) {
    const u = 1 - t;
    // Bernstein weights of the four points.
    const w0 = u * u * u;
    const w1 = 3 * u * u * t;
    const w2 = 3 * u * t * t;
    const w3 = t * t * t;
    return w0 * p0 + w1 * p1 + w2 * p2 + w3 * p3;
}
366
/**
 * Move the mouse to (toX, toY) along a randomised cubic Bezier path.
 *
 * The path starts at a random point in the top-left 30% of the viewport, or
 * at (100, 100) when the page reports no viewport size. Both control points
 * are randomised, and the path is walked in 15-29 segments with one
 * `page.mouse.move` call per sample point; the last sample is the target.
 *
 * @param {object} page - Playwright page whose mouse is moved.
 * @param {number} toX - Target x coordinate.
 * @param {number} toY - Target y coordinate.
 */
async function humanMouseMove(page, toX, toY) {
    const viewport = page.viewportSize();
    let startX = 100;
    let startY = 100;
    if (viewport) {
        startX = Math.random() * viewport.width * 0.3;
        startY = Math.random() * viewport.height * 0.3;
    }
    // Control points: x advances part-way towards the target, y wobbles by up to +-100px.
    const ctrl1X = startX + (toX - startX) * (0.2 + Math.random() * 0.3);
    const ctrl1Y = startY + (Math.random() - 0.5) * 200;
    const ctrl2X = startX + (toX - startX) * (0.5 + Math.random() * 0.3);
    const ctrl2Y = toY + (Math.random() - 0.5) * 200;
    const segments = 15 + Math.floor(Math.random() * 15);
    let sample = 0;
    while (sample <= segments) {
        const t = sample / segments;
        await page.mouse.move(bezierPoint(t, startX, ctrl1X, ctrl2X, toX), bezierPoint(t, startY, ctrl1Y, ctrl2Y, toY));
        sample += 1;
    }
}
382
/**
 * Click the element identified by `command.selector` (a snapshot ref such as
 * @e1 or a regular selector).
 *
 * With `command.newTab` set, nothing is clicked: the element's `href` is
 * resolved against the document base URI and opened in a new tab instead, and
 * an element without an href is an error. Otherwise the mouse is first moved
 * along a Bezier path to a random point inside the element's box (when it has
 * one), then the element is clicked with the requested button, click count
 * and delay. Failures are passed through toAIFriendlyError.
 */
async function handleClick(command, browser) {
    const { selector } = command;
    const target = browser.getLocator(selector);
    try {
        if (command.newTab) {
            // Runs in the page: URL and document.baseURI are browser globals.
            const resolveHref = (el) => {
                const href = el.getAttribute('href');
                if (!href) {
                    return '';
                }
                return new globalThis.URL(href, globalThis.document.baseURI).toString();
            };
            const linkUrl = await target.evaluate(resolveHref);
            if (!linkUrl) {
                throw new Error(`Element '${selector}' does not have an href attribute. --new-tab only works on links.`);
            }
            await browser.newTab();
            // The page is looked up again after newTab() and navigated to the link.
            await browser.getPage().goto(linkUrl);
            return successResponse(command.id, { clicked: true, newTab: true, url: linkUrl });
        }
        // Human-like approach: aim at a random point in the middle 40% of the box.
        const bounds = await target.boundingBox();
        if (bounds) {
            const aimX = bounds.x + bounds.width * (0.3 + Math.random() * 0.4);
            const aimY = bounds.y + bounds.height * (0.3 + Math.random() * 0.4);
            await humanMouseMove(browser.getPage(), aimX, aimY);
        }
        const { button, clickCount, delay } = command;
        await target.click({ button, clickCount, delay });
    }
    catch (error) {
        throw toAIFriendlyError(error, selector);
    }
    return successResponse(command.id, { clicked: true });
}
425
/**
 * Type `command.text` into the element identified by `command.selector`.
 *
 * With `command.clear` the field is emptied first. Without `command.delay`
 * the text is sent via `pressSequentially`. With a delay, the element is
 * focused and each character is typed through the page keyboard, followed by
 * a pause of between 60% and 140% of the delay. Failures are passed through
 * toAIFriendlyError.
 */
async function handleType(command, browser) {
    const field = browser.getLocator(command.selector);
    try {
        if (command.clear) {
            await field.fill('');
        }
        if (!command.delay) {
            await field.pressSequentially(command.text, {});
        }
        else {
            // Humanized typing: one character at a time with a jittered pause (+-40%).
            await field.focus();
            const page = browser.getPage();
            for (const ch of command.text) {
                const pauseMs = command.delay * (0.6 + Math.random() * 0.8);
                await page.keyboard.type(ch, { delay: 0 });
                await page.waitForTimeout(pauseMs);
            }
        }
    }
    catch (error) {
        throw toAIFriendlyError(error, command.selector);
    }
    return successResponse(command.id, { typed: true });
}
450
/**
 * Press `command.key`.
 *
 * With a selector the key is pressed on that element through `page.press`;
 * without one it goes to the page keyboard.
 * NOTE(review): the selector is handed straight to the page, not through
 * browser.getLocator as in sibling handlers - confirm whether snapshot refs
 * are meant to work here.
 */
async function handlePress(command, browser) {
    const page = browser.getPage();
    const { selector, key } = command;
    await (selector ? page.press(selector, key) : page.keyboard.press(key));
    return successResponse(command.id, { pressed: true });
}
460
// DOM id of the temporary container that holds screenshot annotation boxes.
const ANNOTATION_OVERLAY_ID = '__agent_browser_annotations__';
/**
 * Remove the annotation overlay element from the page, if it is present.
 *
 * Best-effort: a rejected in-page evaluation is deliberately ignored, so the
 * returned promise does not reject for that reason.
 *
 * @param {object} page - Playwright page to clean up.
 */
async function removeAnnotationOverlay(page) {
    const overlayId = JSON.stringify(ANNOTATION_OVERLAY_ID);
    const script = `(() => { const el = document.getElementById(${overlayId}); if (el) el.remove(); })()`;
    const removal = page.evaluate(script);
    await removal.catch(() => { });
}
466
/**
 * Decide where the screenshot is written: the caller-supplied path when
 * given, otherwise a fresh timestamped file under <app dir>/tmp/screenshots
 * (the directory is created on demand).
 */
function resolveScreenshotSavePath(command) {
    if (command.path) {
        return command.path;
    }
    const ext = command.format === 'jpeg' ? 'jpg' : 'png';
    const timestamp = new Date().toISOString().replace(/[:.]/g, '-');
    const random = Math.random().toString(36).substring(2, 8);
    const filename = `screenshot-${timestamp}-${random}.${ext}`;
    const screenshotDir = path.join(getAppDir(), 'tmp', 'screenshots');
    mkdirSync(screenshotDir, { recursive: true });
    return path.join(screenshotDir, filename);
}
/** Round a bounding box to whole pixels. */
function roundAnnotationBox(box) {
    return {
        x: Math.round(box.x),
        y: Math.round(box.y),
        width: Math.round(box.width),
        height: Math.round(box.height),
    };
}
/**
 * Measure every ref of an interactive snapshot and return one annotation per
 * ref that resolves to a locator with a non-empty bounding box. Refs that
 * cannot be resolved or measured are skipped rather than failing the capture.
 */
async function collectScreenshotAnnotations(browser) {
    const { refs } = await browser.getSnapshot({ interactive: true });
    const measured = await Promise.all(Object.entries(refs).map(async ([ref, data]) => {
        try {
            const locator = browser.getLocatorFromRef(ref);
            if (!locator) {
                return null;
            }
            const box = await locator.boundingBox();
            if (!box || box.width === 0 || box.height === 0) {
                return null;
            }
            return {
                ref,
                // The label number is the ref with its 'e' removed.
                number: parseInt(ref.replace('e', ''), 10),
                role: data.role,
                name: data.name || undefined,
                box: roundAnnotationBox(box),
            };
        }
        catch {
            return null;
        }
    }));
    return measured.filter((a) => a !== null);
}
/** True when the annotation's box and the target box overlap. */
function annotationOverlapsBox(annotation, tb) {
    const { box } = annotation;
    const ax2 = box.x + box.width;
    const ay2 = box.y + box.height;
    const bx2 = tb.x + tb.width;
    const by2 = tb.y + tb.height;
    return box.x < bx2 && ax2 > tb.x && box.y < by2 && ay2 > tb.y;
}
/**
 * Draw numbered boxes for the given annotations into the page.
 *
 * Uses position:absolute with document-relative coords (viewport box plus the
 * current scroll offset) so labels render correctly for both viewport and
 * fullPage screenshots, and when the screenshot is scoped to a selector
 * element.
 */
async function injectAnnotationOverlay(page, overlayItems) {
    const overlayData = overlayItems.map((a) => ({
        number: a.number,
        x: a.box.x,
        y: a.box.y,
        width: a.box.width,
        height: a.box.height,
    }));
    await page.evaluate(`(() => {
        var items = ${JSON.stringify(overlayData)};
        var id = ${JSON.stringify(ANNOTATION_OVERLAY_ID)};
        var sx = window.scrollX || 0;
        var sy = window.scrollY || 0;
        var c = document.createElement('div');
        c.id = id;
        c.style.cssText = 'position:absolute;top:0;left:0;width:0;height:0;pointer-events:none;z-index:2147483647;';
        for (var i = 0; i < items.length; i++) {
            var it = items[i];
            var dx = it.x + sx;
            var dy = it.y + sy;
            var b = document.createElement('div');
            b.style.cssText = 'position:absolute;left:' + dx + 'px;top:' + dy + 'px;width:' + it.width + 'px;height:' + it.height + 'px;border:2px solid rgba(255,0,0,0.8);box-sizing:border-box;pointer-events:none;';
            var l = document.createElement('div');
            l.textContent = String(it.number);
            var labelTop = dy < 14 ? '2px' : '-14px';
            l.style.cssText = 'position:absolute;top:' + labelTop + ';left:-2px;background:rgba(255,0,0,0.9);color:#fff;font:bold 11px/14px monospace;padding:0 4px;border-radius:2px;white-space:nowrap;';
            b.appendChild(l);
            c.appendChild(b);
        }
        document.documentElement.appendChild(c);
    })()`);
}
/**
 * Convert viewport-relative annotations to image-relative coordinates.
 *
 * Selector capture: shift to be relative to the target element.
 * fullPage capture: shift by the scroll offset to be document-relative.
 * Otherwise: viewport-relative, returned unchanged.
 */
async function toImageRelativeAnnotations(page, overlayItems, targetBox, fullPage) {
    let shiftX;
    let shiftY;
    if (targetBox) {
        shiftX = -targetBox.x;
        shiftY = -targetBox.y;
    }
    else if (fullPage) {
        const scroll = (await page.evaluate(`({x: window.scrollX || 0, y: window.scrollY || 0})`));
        shiftX = scroll.x;
        shiftY = scroll.y;
    }
    else {
        return overlayItems;
    }
    return overlayItems.map((a) => ({
        ...a,
        box: {
            x: a.box.x + shiftX,
            y: a.box.y + shiftY,
            width: a.box.width,
            height: a.box.height,
        },
    }));
}
/**
 * Capture a screenshot of the page, or of the element at `command.selector`.
 *
 * Options read from the command: `fullPage`, `format` (default 'png'),
 * `quality` (applied to jpeg only), `path` (a file under the app's
 * tmp/screenshots directory is generated when omitted) and `annotate`.
 * With `annotate`, numbered boxes for the interactive snapshot refs are drawn
 * into the page for the duration of the capture, and their image-relative
 * boxes are returned as `annotations` when there are any.
 *
 * The injected overlay is removed in a `finally` block, so cleanup runs on
 * both the success and the failure path. When a selector was given, failures
 * are passed through toAIFriendlyError.
 *
 * @returns {Promise<object>} Success response with `path` and, optionally, `annotations`.
 */
async function handleScreenshot(command, browser) {
    const page = browser.getPage();
    const options = {
        fullPage: command.fullPage,
        type: command.format ?? 'png',
    };
    if (command.format === 'jpeg' && command.quality !== undefined) {
        options.quality = command.quality;
    }
    const target = command.selector ? browser.getLocator(command.selector) : page;
    let overlayInjected = false;
    try {
        const savePath = resolveScreenshotSavePath(command);
        let annotations;
        if (command.annotate) {
            const candidates = await collectScreenshotAnnotations(browser);
            // A selector capture is cropped to that element, so only annotations
            // overlapping the target are kept. Coordinates stay viewport-relative
            // for overlay positioning; shifting happens afterwards, for metadata only.
            let targetBox = null;
            if (command.selector) {
                const raw = await browser.getLocator(command.selector).boundingBox();
                if (raw) {
                    targetBox = roundAnnotationBox(raw);
                }
            }
            const overlayItems = (targetBox
                ? candidates.filter((a) => annotationOverlapsBox(a, targetBox))
                : candidates).sort((a, b) => a.number - b.number);
            if (overlayItems.length > 0) {
                await injectAnnotationOverlay(page, overlayItems);
                overlayInjected = true;
            }
            annotations = await toImageRelativeAnnotations(page, overlayItems, targetBox, command.fullPage);
        }
        await target.screenshot({ ...options, path: savePath });
        return successResponse(command.id, {
            path: savePath,
            ...(annotations && annotations.length > 0 ? { annotations } : {}),
        });
    }
    catch (error) {
        if (command.selector) {
            throw toAIFriendlyError(error, command.selector);
        }
        throw error;
    }
    finally {
        if (overlayInjected) {
            await removeAnnotationOverlay(page);
        }
    }
}
641
/**
 * Take an enhanced snapshot (tree plus refs) with the command's optional
 * filters: `interactive`, `cursor`, `maxDepth`, `compact`, `selector`.
 *
 * Each ref is reduced to its role and name for output. The response carries
 * the tree as `snapshot` ('Empty page' when the tree is empty) and `refs`,
 * which is left undefined when there are none.
 */
async function handleSnapshot(command, browser) {
    const { interactive, cursor, maxDepth, compact, selector } = command;
    const { tree, refs } = await browser.getSnapshot({ interactive, cursor, maxDepth, compact, selector });
    // Keep only role and name per ref.
    const simpleRefs = {};
    Object.entries(refs).forEach(([ref, data]) => {
        simpleRefs[ref] = { role: data.role, name: data.name };
    });
    const hasRefs = Object.keys(simpleRefs).length > 0;
    return successResponse(command.id, {
        snapshot: tree || 'Empty page',
        refs: hasRefs ? simpleRefs : undefined,
    });
}
660
/**
 * Evaluate `command.script` in the current page and return its result.
 *
 * The script is handed to `page.evaluate` directly as a string expression.
 */
async function handleEvaluate(command, browser) {
    const result = await browser.getPage().evaluate(command.script);
    return successResponse(command.id, { result });
}
666
/**
 * Wait for one of three things, chosen in this order:
 *  - a selector: wait until it reaches `command.state` (default 'visible'),
 *    bounded by `command.timeout`;
 *  - a timeout only: sleep for `timeout` ms, or for a random duration in
 *    [timeout, timeoutMax] when `timeoutMax` is larger;
 *  - neither: wait for the page 'load' state.
 */
async function handleWait(command, browser) {
    const page = browser.getPage();
    const { selector, timeout } = command;
    if (selector) {
        const state = command.state ?? 'visible';
        await page.waitForSelector(selector, { state, timeout });
    }
    else if (!timeout) {
        // Default: wait for load state.
        await page.waitForLoadState('load');
    }
    else {
        const lower = timeout;
        const upper = command.timeoutMax ?? lower;
        const pauseMs = upper > lower ? lower + Math.random() * (upper - lower) : lower;
        await page.waitForTimeout(Math.round(pauseMs));
    }
    return successResponse(command.id, { waited: true });
}
687
/**
 * Scroll an element or the page.
 *
 * With a selector, the element is scrolled into view if needed and then, when
 * `x` or `y` is given, scrolled by that offset. `direction`/`amount` are not
 * consulted on this path.
 * Without a selector, the window is scrolled by (x, y), both defaulting to 0.
 * A `direction` of up/down/left/right replaces the matching axis with
 * `amount` (default 100), negated for up and left.
 */
async function handleScroll(command, browser) {
    const page = browser.getPage();
    if (!command.selector) {
        let dx = command.x ?? 0;
        let dy = command.y ?? 0;
        const { direction } = command;
        if (direction) {
            const amount = command.amount ?? 100;
            if (direction === 'up') {
                dy = -amount;
            }
            else if (direction === 'down') {
                dy = amount;
            }
            else if (direction === 'left') {
                dx = -amount;
            }
            else if (direction === 'right') {
                dx = amount;
            }
        }
        await page.evaluate(`window.scrollBy(${dx}, ${dy})`);
        return successResponse(command.id, { scrolled: true });
    }
    const element = browser.getLocator(command.selector);
    await element.scrollIntoViewIfNeeded();
    const hasOffset = command.x !== undefined || command.y !== undefined;
    if (hasOffset) {
        // Runs in the page against the element itself.
        await element.evaluate((el, offset) => {
            el.scrollBy(offset.x ?? 0, offset.y ?? 0);
        }, { x: command.x, y: command.y });
    }
    return successResponse(command.id, { scrolled: true });
}
723
/**
 * Select option(s) on the element identified by `command.selector`.
 *
 * `command.values` may be a single value or an array; a single value is
 * wrapped in an array. The response echoes the values array as `selected`.
 * Failures are passed through toAIFriendlyError.
 */
async function handleSelect(command, browser) {
    const dropdown = browser.getLocator(command.selector);
    let values = command.values;
    if (!Array.isArray(values)) {
        values = [values];
    }
    try {
        await dropdown.selectOption(values);
    }
    catch (error) {
        throw toAIFriendlyError(error, command.selector);
    }
    return successResponse(command.id, { selected: values });
}
734
/**
 * Hover over the element identified by `command.selector`.
 *
 * Failures are passed through toAIFriendlyError.
 */
async function handleHover(command, browser) {
    const { id, selector } = command;
    try {
        await browser.getLocator(selector).hover();
    }
    catch (error) {
        throw toAIFriendlyError(error, selector);
    }
    return successResponse(id, { hovered: true });
}
744
/**
 * Returns HTML: the inner HTML of `command.selector` when given,
 * otherwise the full content of the current page.
 */
async function handleContent(command, browser) {
    const page = browser.getPage();
    const html = command.selector
        ? await page.locator(command.selector).innerHTML()
        : await page.content();
    return successResponse(command.id, { html });
}
755
/**
 * Closes the browser and acknowledges with `{ closed: true }`.
 */
async function handleClose(command, browser) {
    await browser.close();
    const payload = { closed: true };
    return successResponse(command.id, payload);
}
759
/**
 * Opens a new tab and, when `command.url` is set, navigates the current page
 * to it (waiting for `domcontentloaded`). Responds with the `newTab()` result.
 */
async function handleTabNew(command, browser) {
    const tabInfo = await browser.newTab();
    if (!command.url) {
        return successResponse(command.id, tabInfo);
    }
    // Navigate to URL if provided (same pattern as handleNavigate)
    await browser.getPage().goto(command.url, { waitUntil: 'domcontentloaded' });
    return successResponse(command.id, tabInfo);
}
768
/**
 * Lists the open tabs together with the index of the active one.
 */
async function handleTabList(command, browser) {
    const tabs = await browser.listTabs();
    const active = browser.getActiveIndex();
    return successResponse(command.id, { tabs, active });
}
775
/**
 * Switches to the tab at `command.index` and responds with the `switchTo()`
 * result extended by the title of the now-current page.
 */
async function handleTabSwitch(command, browser) {
    const switched = await browser.switchTo(command.index);
    const title = await browser.getPage().title();
    return successResponse(command.id, { ...switched, title });
}
783
/**
 * Closes the tab at `command.index` and responds with the `closeTab()` result.
 */
async function handleTabClose(command, browser) {
    const closed = await browser.closeTab(command.index);
    return successResponse(command.id, closed);
}
787
/**
 * Opens a new window using `command.viewport` and responds with the
 * `newWindow()` result.
 */
async function handleWindowNew(command, browser) {
    const opened = await browser.newWindow(command.viewport);
    return successResponse(command.id, opened);
}
791
+ // New handlers for enhanced Playwright parity
792
/**
 * Fills the element resolved from `command.selector` with `command.value`.
 * Errors from `fill` are rethrown via `toAIFriendlyError`.
 */
async function handleFill(command, browser) {
    const target = browser.getLocator(command.selector);
    try {
        await target.fill(command.value);
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { filled: true };
    return successResponse(command.id, payload);
}
802
/**
 * Checks the element resolved from `command.selector`.
 * Errors from `check` are rethrown via `toAIFriendlyError`.
 */
async function handleCheck(command, browser) {
    const target = browser.getLocator(command.selector);
    try {
        await target.check();
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { checked: true };
    return successResponse(command.id, payload);
}
812
/**
 * Unchecks the element resolved from `command.selector`.
 * Errors from `uncheck` are rethrown via `toAIFriendlyError`.
 */
async function handleUncheck(command, browser) {
    const target = browser.getLocator(command.selector);
    try {
        await target.uncheck();
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { unchecked: true };
    return successResponse(command.id, payload);
}
822
/**
 * Sets the input files of the element resolved from `command.selector`.
 * A non-array `command.files` is wrapped into a single-element array.
 * Errors from `setInputFiles` are rethrown via `toAIFriendlyError`.
 */
async function handleUpload(command, browser) {
    const target = browser.getLocator(command.selector);
    const fileList = Array.isArray(command.files) ? command.files : [command.files];
    try {
        await target.setInputFiles(fileList);
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { uploaded: fileList };
    return successResponse(command.id, payload);
}
833
/**
 * Double-clicks the element resolved from `command.selector`.
 * Errors from `dblclick` are rethrown via `toAIFriendlyError`.
 */
async function handleDoubleClick(command, browser) {
    const target = browser.getLocator(command.selector);
    try {
        await target.dblclick();
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { clicked: true };
    return successResponse(command.id, payload);
}
843
/**
 * Focuses the element resolved from `command.selector`.
 * Errors from `focus` are rethrown via `toAIFriendlyError`.
 */
async function handleFocus(command, browser) {
    const target = browser.getLocator(command.selector);
    try {
        await target.focus();
    }
    catch (err) {
        throw toAIFriendlyError(err, command.selector);
    }
    const payload = { focused: true };
    return successResponse(command.id, payload);
}
853
/**
 * Drags `command.source` onto `command.target` within the current frame.
 */
async function handleDrag(command, browser) {
    const activeFrame = browser.getFrame();
    const { source, target } = command;
    await activeFrame.dragAndDrop(source, target);
    return successResponse(command.id, { dragged: true });
}
858
/**
 * Switches to a frame identified by `command.selector`, `command.name`
 * and/or `command.url` (all three are forwarded to `switchToFrame`).
 */
async function handleFrame(command, browser) {
    const { selector, name, url } = command;
    await browser.switchToFrame({ selector, name, url });
    return successResponse(command.id, { switched: true });
}
866
/**
 * Switches back to the main frame and acknowledges with `{ switched: true }`.
 */
async function handleMainFrame(command, browser) {
    browser.switchToMainFrame();
    const payload = { switched: true };
    return successResponse(command.id, payload);
}
870
/**
 * Locates an element by ARIA role (optionally by accessible name) and runs
 * `command.subaction` on it.
 *
 * Supported subactions: 'click', 'fill' (uses `command.value`, default ''),
 * 'check', 'hover'. Any other subaction now yields an error response instead
 * of silently resolving to `undefined`.
 *
 * @param {object} command - Command with `id`, `role`, optional `name`, `exact`, `subaction`, `value`.
 * @param {object} browser - Browser manager providing `getPage()`.
 * @returns {Promise<object>} Success or error response.
 */
async function handleGetByRole(command, browser) {
    const page = browser.getPage();
    const locator = page.getByRole(command.role, { name: command.name, exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
888
/**
 * Locates an element by its text and runs `command.subaction` on it.
 *
 * Supported subactions: 'click', 'hover'. Any other subaction now yields an
 * error response instead of silently resolving to `undefined`.
 *
 * @param {object} command - Command with `id`, `text`, optional `exact`, `subaction`.
 * @param {object} browser - Browser manager providing `getPage()`.
 * @returns {Promise<object>} Success or error response.
 */
async function handleGetByText(command, browser) {
    const page = browser.getPage();
    const locator = page.getByText(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
900
/**
 * Locates an element by its label and runs `command.subaction` on it.
 *
 * Supported subactions: 'click', 'fill' (uses `command.value`, default ''),
 * 'check'. Any other subaction now yields an error response instead of
 * silently resolving to `undefined`.
 *
 * @param {object} command - Command with `id`, `label`, optional `exact`, `subaction`, `value`.
 * @param {object} browser - Browser manager providing `getPage()`.
 * @returns {Promise<object>} Success or error response.
 */
async function handleGetByLabel(command, browser) {
    const page = browser.getPage();
    const locator = page.getByLabel(command.label, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
915
/**
 * Locates an element by its placeholder and runs `command.subaction` on it.
 *
 * Supported subactions: 'click', 'fill' (uses `command.value`, default '').
 * Any other subaction now yields an error response instead of silently
 * resolving to `undefined`.
 *
 * @param {object} command - Command with `id`, `placeholder`, optional `exact`, `subaction`, `value`.
 * @param {object} browser - Browser manager providing `getPage()`.
 * @returns {Promise<object>} Success or error response.
 */
async function handleGetByPlaceholder(command, browser) {
    const page = browser.getPage();
    const locator = page.getByPlaceholder(command.placeholder, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
927
/**
 * Reads cookies from the current page's context, filtered by `command.urls`.
 */
async function handleCookiesGet(command, browser) {
    const ctx = browser.getPage().context();
    const cookies = await ctx.cookies(command.urls);
    return successResponse(command.id, { cookies });
}
933
/**
 * Adds `command.cookies` to the current page's context.
 * A cookie that has none of `url`, `domain` or `path` gets the current page
 * URL as its `url`; all other cookies are passed through unchanged.
 */
async function handleCookiesSet(command, browser) {
    const page = browser.getPage();
    const ctx = page.context();
    const currentUrl = page.url();
    const prepared = command.cookies.map((cookie) => {
        const hasScope = cookie.url || cookie.domain || cookie.path;
        // Auto-fill URL for cookies that don't have domain/path/url set
        return hasScope ? cookie : { ...cookie, url: currentUrl };
    });
    await ctx.addCookies(prepared);
    return successResponse(command.id, { set: true });
}
947
/**
 * Clears all cookies of the current page's context.
 */
async function handleCookiesClear(command, browser) {
    const ctx = browser.getPage().context();
    await ctx.clearCookies();
    return successResponse(command.id, { cleared: true });
}
953
/**
 * Reads from web storage in the page.
 * `command.type === 'local'` selects `localStorage`; anything else selects
 * `sessionStorage`. With `command.key` a single item is returned, otherwise
 * every key/value pair is collected into an object.
 */
async function handleStorageGet(command, browser) {
    const page = browser.getPage();
    const storageName = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    if (!command.key) {
        const data = await page.evaluate(`
      (() => {
        const storage = ${storageName};
        const result = {};
        for (let i = 0; i < storage.length; i++) {
          const key = storage.key(i);
          if (key) result[key] = storage.getItem(key);
        }
        return result;
      })()
    `);
        return successResponse(command.id, { data });
    }
    const keyLiteral = JSON.stringify(command.key);
    const value = await page.evaluate(`${storageName}.getItem(${keyLiteral})`);
    return successResponse(command.id, { key: command.key, value });
}
975
/**
 * Writes `command.value` under `command.key` into `localStorage`
 * (`command.type === 'local'`) or `sessionStorage` (any other type).
 * Key and value are embedded as JSON string literals in the evaluated script.
 */
async function handleStorageSet(command, browser) {
    const page = browser.getPage();
    const storageName = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    const keyLiteral = JSON.stringify(command.key);
    const valueLiteral = JSON.stringify(command.value);
    await page.evaluate(`${storageName}.setItem(${keyLiteral}, ${valueLiteral})`);
    return successResponse(command.id, { set: true });
}
981
/**
 * Clears `localStorage` (`command.type === 'local'`) or `sessionStorage`
 * (any other type) in the current page.
 */
async function handleStorageClear(command, browser) {
    const page = browser.getPage();
    const storageName = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    const script = `${storageName}.clear()`;
    await page.evaluate(script);
    return successResponse(command.id, { cleared: true });
}
987
/**
 * Registers a dialog handler with `command.response` and `command.promptText`
 * and echoes the configured response back.
 */
async function handleDialog(command, browser) {
    const { response, promptText } = command;
    browser.setDialogHandler(response, promptText);
    return successResponse(command.id, { handler: 'set', response });
}
991
/**
 * Renders the current page to a PDF at `command.path`.
 * The paper format defaults to 'Letter' when `command.format` is nullish.
 */
async function handlePdf(command, browser) {
    const pdfOptions = {
        path: command.path,
        format: command.format ?? 'Letter',
    };
    await browser.getPage().pdf(pdfOptions);
    return successResponse(command.id, { path: command.path });
}
999
+ // Network & Request handlers
1000
/**
 * Registers a route for `command.url`, forwarding `command.response` and
 * `command.abort` to `browser.addRoute`.
 */
async function handleRoute(command, browser) {
    const { url, response, abort } = command;
    await browser.addRoute(url, { response, abort });
    return successResponse(command.id, { routed: url });
}
1007
/**
 * Removes the route for `command.url`. The response reports the URL, or
 * 'all' when no URL was given.
 */
async function handleUnroute(command, browser) {
    const { url } = command;
    await browser.removeRoute(url);
    return successResponse(command.id, { unrouted: url ?? 'all' });
}
1011
/**
 * Either clears the tracked requests (`command.clear`) or makes sure request
 * tracking is running and returns the requests matching `command.filter`.
 */
async function handleRequests(command, browser) {
    if (!command.clear) {
        // Start tracking if not already
        browser.startRequestTracking();
        const requests = browser.getRequests(command.filter);
        return successResponse(command.id, { requests });
    }
    browser.clearRequests();
    return successResponse(command.id, { cleared: true });
}
1021
/**
 * Clicks the element resolved from `command.selector`, waits for the
 * resulting download event and saves the download to `command.path`.
 */
async function handleDownload(command, browser) {
    const page = browser.getPage();
    const trigger = browser.getLocator(command.selector);
    // Start listening before the click so the event cannot be missed.
    const pendingDownload = page.waitForEvent('download');
    const pendingClick = trigger.click();
    const [download] = await Promise.all([pendingDownload, pendingClick]);
    await download.saveAs(command.path);
    const suggestedFilename = download.suggestedFilename();
    return successResponse(command.id, { path: command.path, suggestedFilename });
}
1031
/**
 * Sets the geolocation from `command.latitude`, `command.longitude` and
 * `command.accuracy`; the response echoes latitude and longitude.
 */
async function handleGeolocation(command, browser) {
    const { latitude, longitude, accuracy } = command;
    await browser.setGeolocation(latitude, longitude, accuracy);
    return successResponse(command.id, { latitude, longitude });
}
1038
/**
 * Forwards `command.permissions` and `command.grant` to
 * `browser.setPermissions` and echoes both in the response.
 */
async function handlePermissions(command, browser) {
    const { permissions, grant } = command;
    await browser.setPermissions(permissions, grant);
    return successResponse(command.id, { permissions, granted: grant });
}
1045
/**
 * Resizes the viewport to `command.width` x `command.height` and echoes
 * the dimensions.
 */
async function handleViewport(command, browser) {
    const { width, height } = command;
    await browser.setViewport(width, height);
    return successResponse(command.id, { width, height });
}
1052
/**
 * Responds with a note that the user agent cannot be changed here.
 * The current page and its context are still looked up, as before, although
 * the response does not use them.
 */
async function handleUserAgent(command, browser) {
    // Note: Can't change user agent after context is created, but we can for new pages
    browser.getPage().context();
    const note = 'User agent can only be set at launch time. Use device command instead.';
    return successResponse(command.id, { note });
}
1060
/**
 * Applies a named device profile: sets the viewport and either applies the
 * device scale factor (when it is truthy and not 1) or clears any device
 * metrics override. Throws for an unknown device, listing the first ten
 * available names.
 */
async function handleDevice(command, browser) {
    const device = browser.getDevice(command.device);
    if (!device) {
        const available = browser.listDevices().slice(0, 10).join(', ');
        throw new Error(`Unknown device: ${command.device}. Available: ${available}...`);
    }
    const { viewport, deviceScaleFactor } = device;
    // Apply device viewport
    await browser.setViewport(viewport.width, viewport.height);
    const needsScaleOverride = Boolean(deviceScaleFactor) && deviceScaleFactor !== 1;
    if (needsScaleOverride) {
        // Apply device scale factor for HiDPI/retina displays
        await browser.setDeviceScaleFactor(deviceScaleFactor, viewport.width, viewport.height, device.isMobile ?? false);
    }
    else {
        // Clear device scale factor override to restore default (1x)
        try {
            await browser.clearDeviceMetricsOverride();
        }
        catch {
            // Ignore error if override was never set
        }
    }
    return successResponse(command.id, {
        device: command.device,
        viewport,
        userAgent: device.userAgent,
        deviceScaleFactor,
    });
}
1089
/**
 * Navigates back in history and responds with the page URL afterwards.
 */
async function handleBack(command, browser) {
    const page = browser.getPage();
    await page.goBack();
    const url = page.url();
    return successResponse(command.id, { url });
}
1094
/**
 * Navigates forward in history and responds with the page URL afterwards.
 */
async function handleForward(command, browser) {
    const page = browser.getPage();
    await page.goForward();
    const url = page.url();
    return successResponse(command.id, { url });
}
1099
/**
 * Reloads the current page and responds with the page URL afterwards.
 */
async function handleReload(command, browser) {
    const page = browser.getPage();
    await page.reload();
    const url = page.url();
    return successResponse(command.id, { url });
}
1104
/**
 * Responds with the URL of the current page.
 */
async function handleUrl(command, browser) {
    const url = browser.getPage().url();
    return successResponse(command.id, { url });
}
1108
/**
 * Responds with the title of the current page.
 */
async function handleTitle(command, browser) {
    const title = await browser.getPage().title();
    return successResponse(command.id, { title });
}
1113
/**
 * Reads `command.attribute` from the element resolved from `command.selector`.
 */
async function handleGetAttribute(command, browser) {
    const { attribute } = command;
    const value = await browser.getLocator(command.selector).getAttribute(attribute);
    return successResponse(command.id, { attribute, value });
}
1118
/**
 * Reads the `textContent` of the element resolved from `command.selector`.
 */
async function handleGetText(command, browser) {
    const text = await browser.getLocator(command.selector).textContent();
    return successResponse(command.id, { text });
}
1123
/**
 * Reports whether the element resolved from `command.selector` is visible.
 */
async function handleIsVisible(command, browser) {
    const visible = await browser.getLocator(command.selector).isVisible();
    return successResponse(command.id, { visible });
}
1128
/**
 * Reports whether the element resolved from `command.selector` is enabled.
 */
async function handleIsEnabled(command, browser) {
    const enabled = await browser.getLocator(command.selector).isEnabled();
    return successResponse(command.id, { enabled });
}
1133
/**
 * Reports whether the element resolved from `command.selector` is checked.
 */
async function handleIsChecked(command, browser) {
    const checked = await browser.getLocator(command.selector).isChecked();
    return successResponse(command.id, { checked });
}
1138
/**
 * Counts the elements matching `command.selector` on the current page.
 */
async function handleCount(command, browser) {
    const matches = browser.getPage().locator(command.selector);
    const count = await matches.count();
    return successResponse(command.id, { count });
}
1143
/**
 * Responds with the bounding box of the element matching `command.selector`.
 */
async function handleBoundingBox(command, browser) {
    const target = browser.getPage().locator(command.selector);
    const box = await target.boundingBox();
    return successResponse(command.id, { box });
}
1148
/**
 * Extracts tag, trimmed text (first 80 chars), rounded bounding box and a set
 * of computed styles for the element(s) addressed by `command.selector`.
 *
 * A ref selector (per `browser.isRef`) yields exactly one element; a CSS
 * selector may yield many. The extraction logic is shipped to the page as
 * source text and materialised there with `eval`, so both code paths share it.
 */
async function handleStyles(command, browser) {
    const page = browser.getPage();
    // Shared extraction logic as a string to be eval'd in browser context
    const extractorSource = `(function(el) {
    const s = getComputedStyle(el);
    const r = el.getBoundingClientRect();
    return {
      tag: el.tagName.toLowerCase(),
      text: el.innerText?.trim().slice(0, 80) || null,
      box: {
        x: Math.round(r.x),
        y: Math.round(r.y),
        width: Math.round(r.width),
        height: Math.round(r.height),
      },
      styles: {
        fontSize: s.fontSize,
        fontWeight: s.fontWeight,
        fontFamily: s.fontFamily.split(',')[0].trim().replace(/"/g, ''),
        color: s.color,
        backgroundColor: s.backgroundColor,
        borderRadius: s.borderRadius,
        border: s.border !== 'none' && s.borderWidth !== '0px' ? s.border : null,
        boxShadow: s.boxShadow !== 'none' ? s.boxShadow : null,
        padding: s.padding,
      },
    };
  })`;
    if (!browser.isRef(command.selector)) {
        // CSS selector - can match multiple elements
        const elements = (await page.$$eval(command.selector, (nodes, source) => {
            const extract = eval(source);
            return nodes.map((node) => extract(node));
        }, extractorSource));
        return successResponse(command.id, { elements });
    }
    // Ref - single element
    const refLocator = browser.getLocator(command.selector);
    const single = (await refLocator.evaluate((node, source) => {
        const extract = eval(source);
        return extract(node);
    }, extractorSource));
    return successResponse(command.id, { elements: [single] });
}
1192
+ // Advanced handlers
1193
/**
 * Does not start a recording; responds with a note that video recording has
 * to be enabled at launch, echoing `command.path`.
 */
async function handleVideoStart(command, browser) {
    // Video recording requires context-level setup at launch
    // For now, return a note about this limitation
    const note = 'Video recording must be enabled at browser launch. Use --video flag when starting.';
    return successResponse(command.id, { note, path: command.path });
}
1201
/**
 * Responds with the path of the current page's video, or with a note when
 * the page has no video.
 */
async function handleVideoStop(command, browser) {
    const recording = browser.getPage().video();
    if (!recording) {
        return successResponse(command.id, { note: 'No video recording active' });
    }
    const path = await recording.path();
    return successResponse(command.id, { path });
}
1210
/**
 * Starts tracing, forwarding `command.screenshots` and `command.snapshots`.
 */
async function handleTraceStart(command, browser) {
    const { screenshots, snapshots } = command;
    await browser.startTracing({ screenshots, snapshots });
    return successResponse(command.id, { started: true });
}
1217
/**
 * Stops tracing. The response carries `path` when `command.path` is truthy,
 * otherwise `{ traceStopped: true }`.
 */
async function handleTraceStop(command, browser) {
    await browser.stopTracing(command.path);
    if (command.path) {
        return successResponse(command.id, { path: command.path });
    }
    return successResponse(command.id, { traceStopped: true });
}
1221
/**
 * Starts profiling with `command.categories`.
 */
async function handleProfilerStart(command, browser) {
    const { categories } = command;
    await browser.startProfiling({ categories });
    return successResponse(command.id, { started: true });
}
1225
/**
 * Stops profiling and writes the profile to `command.path`. When no path is
 * given, a file named `profile-<timestamp>-<random>.json` is used inside
 * `<appDir>/tmp/profiles`, which is created if necessary.
 */
async function handleProfilerStop(command, browser) {
    let destination = command.path;
    if (!destination) {
        const stamp = new Date().toISOString().replace(/[:.]/g, '-');
        const suffix = Math.random().toString(36).substring(2, 8);
        const profilesDir = path.join(getAppDir(), 'tmp', 'profiles');
        mkdirSync(profilesDir, { recursive: true });
        destination = path.join(profilesDir, `profile-${stamp}-${suffix}.json`);
    }
    const outcome = await browser.stopProfiling(destination);
    return successResponse(command.id, outcome);
}
1238
/**
 * Starts HAR recording and request tracking.
 */
async function handleHarStart(command, browser) {
    await browser.startHarRecording();
    browser.startRequestTracking();
    const payload = { started: true };
    return successResponse(command.id, payload);
}
1243
/**
 * Responds with `command.path` and the number of tracked requests.
 * This handler itself does not write a file.
 */
async function handleHarStop(command, browser) {
    // HAR recording is handled at context level
    // For now, we save tracked requests as a simplified HAR-like format
    const requestCount = browser.getRequests().length;
    return successResponse(command.id, { path: command.path, requestCount });
}
1252
/**
 * Saves the storage state to `command.path` and echoes the path.
 */
async function handleStateSave(command, browser) {
    const { path: statePath } = command;
    await browser.saveStorageState(statePath);
    return successResponse(command.id, { path: statePath });
}
1256
/**
 * Launches a headless browser with the state file at `command.path`.
 * Returns an error response when the browser is already launched or when
 * the state file does not exist.
 */
async function handleStateLoad(command, browser) {
    const { id, path: statePath } = command;
    if (browser.isLaunched()) {
        return errorResponse(id, 'Cannot load state while browser is running. Close browser first, then relaunch with loaded state.');
    }
    if (!fs.existsSync(statePath)) {
        return errorResponse(id, `State file not found: ${statePath}`);
    }
    const launchCommand = {
        id,
        action: 'launch',
        headless: true,
        autoStateFilePath: statePath,
    };
    await browser.launch(launchCommand);
    return successResponse(id, { loaded: true, path: statePath });
}
1274
/**
 * Lists the saved state files with path, size, modification time and an
 * `encrypted` flag, newest first. A file that cannot be read or parsed as
 * JSON is reported with `encrypted: false`.
 */
async function handleStateList(command) {
    const sessionsDir = getSessionsDir();
    const filenames = listStateFiles();
    if (filenames.length === 0) {
        return successResponse(command.id, { files: [], directory: sessionsDir });
    }
    const describe = (filename) => {
        const filepath = path.join(sessionsDir, filename);
        const stats = fs.statSync(filepath);
        let encrypted = false;
        try {
            encrypted = isEncryptedPayload(JSON.parse(fs.readFileSync(filepath, 'utf-8')));
        }
        catch {
            // Ignore parse errors
        }
        return {
            filename,
            path: filepath,
            size: stats.size,
            modified: stats.mtime.toISOString(),
            encrypted,
        };
    };
    const newestFirst = (a, b) => new Date(b.modified).getTime() - new Date(a.modified).getTime();
    const stateFiles = filenames.map(describe).sort(newestFirst);
    return successResponse(command.id, { files: stateFiles, directory: sessionsDir });
}
1304
/**
 * Deletes saved state files: all of them when `command.all` is set,
 * otherwise those whose name starts with `<sessionName>-`. With neither
 * option nothing is deleted. An invalid session name yields an error response.
 */
async function handleStateClear(command) {
    const sessionsDir = getSessionsDir();
    if (command.sessionName && !isValidSessionName(command.sessionName)) {
        return errorResponse(command.id, 'Invalid session name. Use only letters, numbers, dashes, and underscores.');
    }
    const candidates = listStateFiles();
    if (candidates.length === 0) {
        return successResponse(command.id, { cleared: 0, deleted: [] });
    }
    let matches;
    if (command.all) {
        matches = () => true;
    }
    else if (command.sessionName) {
        const prefix = `${command.sessionName}-`;
        matches = (name) => name.startsWith(prefix);
    }
    else {
        matches = () => false;
    }
    const deleted = [];
    for (const name of candidates) {
        if (!matches(name)) {
            continue;
        }
        fs.unlinkSync(path.join(sessionsDir, name));
        deleted.push(name);
    }
    return successResponse(command.id, { cleared: deleted.length, deleted });
}
1330
/**
 * Shows one saved state file: metadata, a summary (cookie count, origin
 * count, distinct cookie domains) and the state itself.
 * `command.filename` must end in `.json` and its base name must pass
 * `isValidSessionName`; otherwise, or when the file is missing or cannot be
 * read, an error response is returned.
 */
async function handleStateShow(command) {
    const sessionsDir = getSessionsDir();
    const { filename } = command;
    const baseName = filename.replace(/\.json$/, '');
    const nameIsValid = filename.endsWith('.json') && isValidSessionName(baseName);
    if (!nameIsValid) {
        return errorResponse(command.id, 'Invalid filename. Use only letters, numbers, dashes, and underscores (with .json extension).');
    }
    const filepath = path.join(sessionsDir, filename);
    if (!fs.existsSync(filepath)) {
        return errorResponse(command.id, `State file not found: ${filename}`);
    }
    try {
        const { data: state, wasEncrypted } = readStateFile(filepath);
        const stats = fs.statSync(filepath);
        const cookieList = state.cookies || [];
        const summary = {
            cookies: state.cookies?.length || 0,
            origins: state.origins?.length || 0,
            domains: Array.from(new Set(cookieList.map((cookie) => cookie.domain))),
        };
        return successResponse(command.id, {
            filename,
            path: filepath,
            size: stats.size,
            modified: stats.mtime.toISOString(),
            encrypted: wasEncrypted,
            summary,
            state,
        });
    }
    catch (err) {
        return errorResponse(command.id, `Failed to parse state file: ${err.message}`);
    }
}
1365
/**
 * Runs `cleanupExpiredStates(command.days)` and reports what was deleted
 * together with the number of state files still listed afterwards.
 */
async function handleStateClean(command) {
    const { days } = command;
    const deleted = cleanupExpiredStates(days);
    const keptCount = listStateFiles().length;
    return successResponse(command.id, { cleaned: deleted.length, deleted, keptCount, days });
}
1375
/**
 * Renames `<oldName>.json` to `<newName>.json` in the sessions directory.
 * Returns an error response for invalid names, a missing source file or an
 * already existing destination.
 */
async function handleStateRename(command) {
    const sessionsDir = getSessionsDir();
    const { id, oldName, newName } = command;
    const namesAreValid = isValidSessionName(oldName) && isValidSessionName(newName);
    if (!namesAreValid) {
        return errorResponse(id, 'Invalid name. Use only letters, numbers, dashes, and underscores.');
    }
    const sourceFile = `${oldName}.json`;
    const destFile = `${newName}.json`;
    const oldPath = path.join(sessionsDir, sourceFile);
    const newPath = path.join(sessionsDir, destFile);
    if (!fs.existsSync(oldPath)) {
        return errorResponse(id, `State file not found: ${sourceFile}`);
    }
    if (fs.existsSync(newPath)) {
        return errorResponse(id, `Destination already exists: ${destFile}`);
    }
    fs.renameSync(oldPath, newPath);
    return successResponse(id, {
        renamed: true,
        oldName: sourceFile,
        newName: destFile,
        path: newPath,
    });
}
1396
/**
 * Clears the collected console messages (`command.clear`) or returns them.
 */
async function handleConsole(command, browser) {
    if (!command.clear) {
        const messages = browser.getConsoleMessages();
        return successResponse(command.id, { messages });
    }
    browser.clearConsoleMessages();
    return successResponse(command.id, { cleared: true });
}
1404
/**
 * Clears the collected page errors (`command.clear`) or returns them.
 */
async function handleErrors(command, browser) {
    if (!command.clear) {
        const errors = browser.getPageErrors();
        return successResponse(command.id, { errors });
    }
    browser.clearPageErrors();
    return successResponse(command.id, { cleared: true });
}
1412
/**
 * Performs a keyboard action on the current page.
 *
 * `command.subaction` defaults to 'press'. Supported values:
 *  - 'type': types `command.text`; with a truthy `command.delay` each
 *    character is typed individually, followed by a randomised pause of
 *    0.6x to 1.4x the delay.
 *  - 'press': presses `command.keys`.
 *  - 'insertText': inserts `command.text` directly.
 * Anything else yields an error response.
 */
async function handleKeyboard(command, browser) {
    const { keyboard } = browser.getPage();
    const page = browser.getPage();
    const sub = command.subaction ?? 'press';
    if (sub === 'type') {
        const text = command.text ?? '';
        if (!command.delay) {
            await page.keyboard.type(text);
        }
        else {
            for (const char of text) {
                const pause = command.delay * (0.6 + Math.random() * 0.8);
                await page.keyboard.type(char, { delay: 0 });
                await page.waitForTimeout(pause);
            }
        }
        return successResponse(command.id, { typed: true, text: command.text });
    }
    if (sub === 'press') {
        await page.keyboard.press(command.keys ?? '');
        return successResponse(command.id, { pressed: command.keys });
    }
    if (sub === 'insertText') {
        await page.keyboard.insertText(command.text ?? '');
        return successResponse(command.id, { inserted: true, text: command.text });
    }
    return errorResponse(command.id, `Unknown keyboard subaction: ${sub}`);
}
1440
/**
 * Dispatches a mouse wheel event with `command.deltaX` / `command.deltaY`
 * (default 0 each). When `command.selector` is set, the matching element is
 * hovered first.
 */
async function handleWheel(command, browser) {
    const page = browser.getPage();
    if (command.selector) {
        await page.locator(command.selector).hover();
    }
    const dx = command.deltaX ?? 0;
    const dy = command.deltaY ?? 0;
    await page.mouse.wheel(dx, dy);
    return successResponse(command.id, { scrolled: true });
}
1449
/**
 * Taps the element matching `command.selector` on the current page.
 */
async function handleTap(command, browser) {
    await browser.getPage().tap(command.selector);
    const payload = { tapped: true };
    return successResponse(command.id, payload);
}
1453
+ }
1454
+ async function handleClipboard(command, browser) {
1455
+ const page = browser.getPage();
1456
+ switch (command.operation) {
1457
+ case 'copy':
1458
+ await page.keyboard.press('Control+c');
1459
+ return successResponse(command.id, { copied: true });
1460
+ case 'paste':
1461
+ await page.keyboard.press('Control+v');
1462
+ return successResponse(command.id, { pasted: true });
1463
+ case 'read':
1464
+ const text = await page.evaluate('navigator.clipboard.readText()');
1465
+ return successResponse(command.id, { text });
1466
+ default:
1467
+ return errorResponse(command.id, 'Unknown clipboard operation');
1468
+ }
1469
+ }
1470
/**
 * Highlights the element matching `command.selector` on the current page.
 */
async function handleHighlight(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.highlight();
    return successResponse(command.id, { highlighted: true });
}
1475
/**
 * Clears the input matching `command.selector` on the current page.
 */
async function handleClear(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.clear();
    return successResponse(command.id, { cleared: true });
}
1480
/**
 * Selects the text of the element matching `command.selector`.
 */
async function handleSelectAll(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.selectText();
    return successResponse(command.id, { selected: true });
}
1485
/**
 * Responds with the `innerText` of the element matching `command.selector`.
 */
async function handleInnerText(command, browser) {
    const target = browser.getPage().locator(command.selector);
    const text = await target.innerText();
    return successResponse(command.id, { text });
}
1490
/**
 * Responds with the `innerHTML` of the element matching `command.selector`.
 */
async function handleInnerHtml(command, browser) {
    const target = browser.getPage().locator(command.selector);
    const html = await target.innerHTML();
    return successResponse(command.id, { html });
}
1495
/**
 * Responds with the input value of the element resolved from `command.selector`.
 */
async function handleInputValue(command, browser) {
    const value = await browser.getLocator(command.selector).inputValue();
    return successResponse(command.id, { value });
}
1500
/**
 * Fills the element matching `command.selector` with `command.value`.
 */
async function handleSetValue(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.fill(command.value);
    return successResponse(command.id, { set: true });
}
1505
/**
 * Dispatches `command.event` (with `command.eventInit`) on the element
 * matching `command.selector`.
 */
async function handleDispatch(command, browser) {
    const { event, eventInit } = command;
    const target = browser.getPage().locator(command.selector);
    await target.dispatchEvent(event, eventInit);
    return successResponse(command.id, { dispatched: event });
}
1510
/**
 * Evaluates `command.script` in the page as a handle and responds with its
 * JSON value, or with the placeholder string 'Handle (non-serializable)'
 * when the value cannot be serialised.
 *
 * The handle is disposed once the value has been read; previously it was
 * left alive after every call.
 *
 * @param {object} command - Command with `id` and `script`.
 * @param {object} browser - Browser manager providing `getPage()`.
 * @returns {Promise<object>} Success response with `{ result }`.
 */
async function handleEvalHandle(command, browser) {
    const page = browser.getPage();
    const handle = await page.evaluateHandle(command.script);
    let result;
    try {
        result = await handle.jsonValue().catch(() => 'Handle (non-serializable)');
    }
    finally {
        // Best-effort cleanup: a failed dispose must not mask the evaluation result.
        await handle.dispose().catch(() => { });
    }
    return successResponse(command.id, { result });
}
1516
/**
 * Exposes a function named `command.name` on the page. The exposed function
 * returns the string `Function <name> called`.
 */
async function handleExpose(command, browser) {
    const page = browser.getPage();
    // Exposed function - can be extended
    const exposed = () => `Function ${command.name} called`;
    await page.exposeFunction(command.name, exposed);
    return successResponse(command.id, { exposed: command.name });
}
1524
/**
 * Adds a script tag to the page from `command.content`, or from
 * `command.url` when no content is given. With neither, no tag is added,
 * but the response is still `{ added: true }`.
 */
async function handleAddScript(command, browser) {
    const page = browser.getPage();
    const { content, url } = command;
    if (content) {
        await page.addScriptTag({ content });
    }
    else if (url) {
        await page.addScriptTag({ url });
    }
    return successResponse(command.id, { added: true });
}
1534
/**
 * Adds a style tag to the page from `command.content`, or from
 * `command.url` when no content is given. With neither, no tag is added,
 * but the response is still `{ added: true }`.
 */
async function handleAddStyle(command, browser) {
    const page = browser.getPage();
    const { content, url } = command;
    if (content) {
        await page.addStyleTag({ content });
    }
    else if (url) {
        await page.addStyleTag({ url });
    }
    return successResponse(command.id, { added: true });
}
1544
/**
 * Emulates media features on the current page (`media`, `colorScheme`,
 * `reducedMotion`, `forcedColors`). A truthy `colorScheme` is additionally
 * passed to `browser.setColorScheme`.
 */
async function handleEmulateMedia(command, browser) {
    const { media, colorScheme, reducedMotion, forcedColors } = command;
    await browser.getPage().emulateMedia({ media, colorScheme, reducedMotion, forcedColors });
    if (colorScheme) {
        browser.setColorScheme(colorScheme);
    }
    return successResponse(command.id, { emulated: true });
}
1557
/**
 * Forwards `command.offline` to `browser.setOffline` and echoes it back.
 *
 * @param {object} command - Reads `id` and `offline`.
 * @param {object} browser - Must provide `setOffline()`.
 * @returns {Promise<object>} `successResponse` payload `{ offline }`.
 */
async function handleOffline(command, browser) {
    const { id, offline } = command;
    await browser.setOffline(offline);
    return successResponse(id, { offline });
}
1561
/**
 * Forwards `command.headers` to `browser.setExtraHeaders`.
 *
 * @param {object} command - Reads `id` and `headers`.
 * @param {object} browser - Must provide `setExtraHeaders()`.
 * @returns {Promise<object>} `successResponse` payload `{ set: true }`.
 */
async function handleHeaders(command, browser) {
    const { id, headers } = command;
    await browser.setExtraHeaders(headers);
    return successResponse(id, { set: true });
}
1565
/**
 * Calls `pause()` on the current page and reports success once it resolves.
 *
 * @param {object} command - Reads `id`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ paused: true }`.
 */
async function handlePause(command, browser) {
    await browser.getPage().pause();
    return successResponse(command.id, { paused: true });
}
1570
/**
 * Locates an element by alt text and performs `command.subaction` on it.
 *
 * Supported subactions are 'click' and 'hover'. Any other value yields an
 * error response rather than silently resolving to `undefined`.
 *
 * @param {object} command - Reads `id`, `text`, `exact` and `subaction`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` for a supported subaction,
 *   otherwise an `errorResponse`.
 */
async function handleGetByAltText(command, browser) {
    const page = browser.getPage();
    const locator = page.getByAltText(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1582
/**
 * Locates an element by its title and performs `command.subaction` on it.
 *
 * Supported subactions are 'click' and 'hover'. Any other value yields an
 * error response rather than silently resolving to `undefined`.
 *
 * @param {object} command - Reads `id`, `text`, `exact` and `subaction`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` for a supported subaction,
 *   otherwise an `errorResponse`.
 */
async function handleGetByTitle(command, browser) {
    const page = browser.getPage();
    const locator = page.getByTitle(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1594
/**
 * Locates an element by test id and performs `command.subaction` on it.
 *
 * Supported subactions are 'click', 'fill' (using `command.value`, or an
 * empty string when it is null/undefined), 'check' and 'hover'. Any other
 * value yields an error response rather than silently resolving to
 * `undefined`.
 *
 * @param {object} command - Reads `id`, `testId`, `subaction` and `value`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` for a supported subaction,
 *   otherwise an `errorResponse`.
 */
async function handleGetByTestId(command, browser) {
    const page = browser.getPage();
    const locator = page.getByTestId(command.testId);
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1612
/**
 * Picks one match of `command.selector` by position and performs
 * `command.subaction` on it.
 *
 * An index of -1 selects the last match; any other index is passed to
 * `nth()`. Supported subactions are 'click', 'fill' (using `command.value`,
 * or an empty string when it is null/undefined), 'check', 'hover' and 'text'.
 * Any other value yields an error response rather than silently resolving to
 * `undefined`.
 *
 * @param {object} command - Reads `id`, `selector`, `index`, `subaction`
 *   and `value`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` for a supported subaction,
 *   otherwise an `errorResponse`.
 */
async function handleNth(command, browser) {
    const page = browser.getPage();
    const base = page.locator(command.selector);
    const locator = command.index === -1 ? base.last() : base.nth(command.index);
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        case 'text': {
            // Braces give the declaration its own scope instead of leaking it
            // across every case of the switch.
            const text = await locator.textContent();
            return successResponse(command.id, { text });
        }
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1634
/**
 * Waits until the page URL matches `command.url`, then reports the page's
 * current URL.
 *
 * @param {object} command - Reads `id`, `url` and `timeout`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ url }`.
 */
async function handleWaitForUrl(command, browser) {
    const activePage = browser.getPage();
    const waitOptions = { timeout: command.timeout };
    await activePage.waitForURL(command.url, waitOptions);
    const currentUrl = activePage.url();
    return successResponse(command.id, { url: currentUrl });
}
1639
/**
 * Waits for the page to reach the load state named by `command.state`.
 *
 * @param {object} command - Reads `id`, `state` and `timeout`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ state }`.
 */
async function handleWaitForLoadState(command, browser) {
    const waitOptions = { timeout: command.timeout };
    await browser.getPage().waitForLoadState(command.state, waitOptions);
    return successResponse(command.id, { state: command.state });
}
1644
/**
 * Replaces the page content with the markup in `command.html`.
 *
 * @param {object} command - Reads `id` and `html`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ set: true }`.
 */
async function handleSetContent(command, browser) {
    await browser.getPage().setContent(command.html);
    return successResponse(command.id, { set: true });
}
1649
/**
 * Responds to a timezone request with a note that the timezone can only be
 * chosen at browser launch (via the `--timezone` flag), echoing back the
 * requested value.
 *
 * This handler does not touch the page or its context. An earlier version
 * called `setGeolocation({ latitude: 0, longitude: 0 })` here, which silently
 * overwrote any geolocation already configured for the context and had no
 * effect on the timezone.
 *
 * @param {object} command - Reads `id` and `timezone`.
 * @param {object} browser - Unused; kept for a uniform handler signature.
 * @returns {Promise<object>} `successResponse` payload `{ note, timezone }`.
 */
async function handleTimezone(command, browser) {
    return successResponse(command.id, {
        note: 'Timezone must be set at browser launch. Use --timezone flag.',
        timezone: command.timezone,
    });
}
1659
/**
 * Responds to a locale request with a note that the locale can only be
 * chosen at browser launch (via the `--locale` flag), echoing back the
 * requested value. Nothing is changed on the browser.
 *
 * @param {object} command - Reads `id` and `locale`.
 * @param {object} browser - Unused by this handler.
 * @returns {Promise<object>} `successResponse` payload `{ note, locale }`.
 */
async function handleLocale(command, browser) {
    const { id, locale } = command;
    const note = 'Locale must be set at browser launch. Use --locale flag.';
    return successResponse(id, { note, locale });
}
1666
/**
 * Sets HTTP credentials on the context of the current page.
 *
 * @param {object} command - Reads `id`, `username` and `password`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ set: true }`.
 */
async function handleCredentials(command, browser) {
    const pageContext = browser.getPage().context();
    const { username, password } = command;
    await pageContext.setHTTPCredentials({ username, password });
    return successResponse(command.id, { set: true });
}
1674
/**
 * Moves the page's mouse to (`command.x`, `command.y`).
 *
 * @param {object} command - Reads `id`, `x` and `y`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ moved: true, x, y }`.
 */
async function handleMouseMove(command, browser) {
    const { mouse } = browser.getPage();
    await mouse.move(command.x, command.y);
    return successResponse(command.id, { moved: true, x: command.x, y: command.y });
}
1679
/**
 * Presses a mouse button on the page; defaults to the left button when
 * `command.button` is null or undefined.
 *
 * @param {object} command - Reads `id` and `button`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ down: true }`.
 */
async function handleMouseDown(command, browser) {
    const activePage = browser.getPage();
    const button = command.button ?? 'left';
    await activePage.mouse.down({ button });
    return successResponse(command.id, { down: true });
}
1684
/**
 * Releases a mouse button on the page; defaults to the left button when
 * `command.button` is null or undefined.
 *
 * @param {object} command - Reads `id` and `button`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ up: true }`.
 */
async function handleMouseUp(command, browser) {
    const activePage = browser.getPage();
    const button = command.button ?? 'left';
    await activePage.mouse.up({ button });
    return successResponse(command.id, { up: true });
}
1689
/**
 * Calls `bringToFront()` on the current page.
 *
 * @param {object} command - Reads `id`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ focused: true }`.
 */
async function handleBringToFront(command, browser) {
    await browser.getPage().bringToFront();
    return successResponse(command.id, { focused: true });
}
1694
/**
 * Passes `command.expression` to the page's `waitForFunction` and resolves
 * once that wait completes.
 *
 * @param {object} command - Reads `id`, `expression` and `timeout`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ waited: true }`.
 */
async function handleWaitForFunction(command, browser) {
    const waitOptions = { timeout: command.timeout };
    await browser.getPage().waitForFunction(command.expression, waitOptions);
    return successResponse(command.id, { waited: true });
}
1699
/**
 * Scrolls the element resolved by `browser.getLocator(command.selector)`
 * into view if it is not already visible.
 *
 * @param {object} command - Reads `id` and `selector`.
 * @param {object} browser - Must provide `getLocator()`.
 * @returns {Promise<object>} `successResponse` payload `{ scrolled: true }`.
 */
async function handleScrollIntoView(command, browser) {
    const target = browser.getLocator(command.selector);
    await target.scrollIntoViewIfNeeded();
    return successResponse(command.id, { scrolled: true });
}
1703
/**
 * Registers `command.script` as an init script on the context of the
 * current page.
 *
 * @param {object} command - Reads `id` and `script`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ added: true }`.
 */
async function handleAddInitScript(command, browser) {
    const pageContext = browser.getPage().context();
    await pageContext.addInitScript(command.script);
    return successResponse(command.id, { added: true });
}
1708
/**
 * Presses (without releasing) the key named by `command.key`.
 *
 * @param {object} command - Reads `id` and `key`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ down: true, key }`.
 */
async function handleKeyDown(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.down(command.key);
    return successResponse(command.id, { down: true, key: command.key });
}
1713
/**
 * Releases the key named by `command.key`.
 *
 * @param {object} command - Reads `id` and `key`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ up: true, key }`.
 */
async function handleKeyUp(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.up(command.key);
    return successResponse(command.id, { up: true, key: command.key });
}
1718
/**
 * Inserts `command.text` through the page keyboard's `insertText`.
 *
 * @param {object} command - Reads `id` and `text`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ inserted: true }`.
 */
async function handleInsertText(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.insertText(command.text);
    return successResponse(command.id, { inserted: true });
}
1723
/**
 * Selects `command.values` on the element matched by `command.selector` and
 * returns whatever `selectOption` reports as selected.
 *
 * @param {object} command - Reads `id`, `selector` and `values`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ selected }`.
 */
async function handleMultiSelect(command, browser) {
    const dropdown = browser.getPage().locator(command.selector);
    const selected = await dropdown.selectOption(command.values);
    return successResponse(command.id, { selected });
}
1728
/**
 * Waits for the next 'download' event on the page and reports where the
 * file ended up.
 *
 * When `command.path` is given the download is saved there. Otherwise the
 * download's own path is used, falling back to its suggested filename when
 * that path is falsy.
 *
 * @param {object} command - Reads `id`, `timeout` and `path`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload
 *   `{ path, filename, url }`.
 */
async function handleWaitForDownload(command, browser) {
    const activePage = browser.getPage();
    const download = await activePage.waitForEvent('download', { timeout: command.timeout });
    const resolveSavedPath = async () => {
        if (command.path) {
            const destination = command.path;
            await download.saveAs(destination);
            return destination;
        }
        return (await download.path()) || download.suggestedFilename();
    };
    const savedPath = await resolveSavedPath();
    return successResponse(command.id, {
        path: savedPath,
        filename: download.suggestedFilename(),
        url: download.url(),
    });
}
1745
/**
 * Waits for a response whose URL contains `command.url` and returns its
 * body, parsed as JSON when possible and as the raw text otherwise.
 *
 * @param {object} command - Reads `id`, `url` and `timeout`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload
 *   `{ url, status, body }`.
 */
async function handleResponseBody(command, browser) {
    const activePage = browser.getPage();
    const urlMatches = (resp) => resp.url().includes(command.url);
    const response = await activePage.waitForResponse(urlMatches, { timeout: command.timeout });
    const rawText = await response.text();
    const parseOrKeep = (text) => {
        try {
            return JSON.parse(text);
        }
        catch {
            // Not JSON: hand the text back untouched
            return text;
        }
    };
    const body = parseOrKeep(rawText);
    return successResponse(command.id, {
        url: response.url(),
        status: response.status(),
        body,
    });
}
1764
+ // Screencast and input injection handlers
1765
/**
 * Starts a screencast that delivers frames to the module-level
 * `screencastFrameCallback`.
 *
 * @param {object} command - Reads `id`, `format`, `quality`, `maxWidth`,
 *   `maxHeight` and `everyNthFrame`.
 * @param {object} browser - Must provide `startScreencast()`.
 * @returns {Promise<object>} `successResponse` payload
 *   `{ started: true, format, quality }`, where `format` is reported as
 *   'jpeg' and `quality` as 80 when the command leaves them null/undefined.
 * @throws {Error} When no frame callback has been set.
 */
async function handleScreencastStart(command, browser) {
    if (!screencastFrameCallback) {
        throw new Error('Screencast frame callback not set. Start the streaming server first.');
    }
    const { format, quality, maxWidth, maxHeight, everyNthFrame } = command;
    const castOptions = { format, quality, maxWidth, maxHeight, everyNthFrame };
    await browser.startScreencast(screencastFrameCallback, castOptions);
    return successResponse(command.id, {
        started: true,
        format: format ?? 'jpeg',
        quality: quality ?? 80,
    });
}
1782
/**
 * Stops the screencast via `browser.stopScreencast()`.
 *
 * @param {object} command - Reads `id`.
 * @param {object} browser - Must provide `stopScreencast()`.
 * @returns {Promise<object>} `successResponse` payload `{ stopped: true }`.
 */
async function handleScreencastStop(command, browser) {
    const { id } = command;
    await browser.stopScreencast();
    return successResponse(id, { stopped: true });
}
1786
/**
 * Forwards a mouse event description to `browser.injectMouseEvent`.
 *
 * @param {object} command - Reads `id`, `type`, `x`, `y`, `button`,
 *   `clickCount`, `deltaX`, `deltaY` and `modifiers`.
 * @param {object} browser - Must provide `injectMouseEvent()`.
 * @returns {Promise<object>} `successResponse` payload `{ injected: true }`.
 */
async function handleInputMouse(command, browser) {
    const { type, x, y, button, clickCount, deltaX, deltaY, modifiers } = command;
    const mouseEvent = { type, x, y, button, clickCount, deltaX, deltaY, modifiers };
    await browser.injectMouseEvent(mouseEvent);
    return successResponse(command.id, { injected: true });
}
1799
/**
 * Forwards a keyboard event description to `browser.injectKeyboardEvent`.
 *
 * @param {object} command - Reads `id`, `type`, `key`, `code`, `text` and
 *   `modifiers`.
 * @param {object} browser - Must provide `injectKeyboardEvent()`.
 * @returns {Promise<object>} `successResponse` payload `{ injected: true }`.
 */
async function handleInputKeyboard(command, browser) {
    const { type, key, code, text, modifiers } = command;
    const keyEvent = { type, key, code, text, modifiers };
    await browser.injectKeyboardEvent(keyEvent);
    return successResponse(command.id, { injected: true });
}
1809
/**
 * Forwards a touch event description to `browser.injectTouchEvent`.
 *
 * @param {object} command - Reads `id`, `type`, `touchPoints` and
 *   `modifiers`.
 * @param {object} browser - Must provide `injectTouchEvent()`.
 * @returns {Promise<object>} `successResponse` payload `{ injected: true }`.
 */
async function handleInputTouch(command, browser) {
    const { type, touchPoints, modifiers } = command;
    const touchEvent = { type, touchPoints, modifiers };
    await browser.injectTouchEvent(touchEvent);
    return successResponse(command.id, { injected: true });
}
1817
+ // Recording handlers (Playwright native video recording)
1818
/**
 * Starts a recording through `browser.startRecording`, passing the output
 * path and the optional URL from the command.
 *
 * @param {object} command - Reads `id`, `path` and `url`.
 * @param {object} browser - Must provide `startRecording()`.
 * @returns {Promise<object>} `successResponse` payload
 *   `{ started: true, path }`.
 */
async function handleRecordingStart(command, browser) {
    const { id, path: outputPath, url } = command;
    await browser.startRecording(outputPath, url);
    return successResponse(id, { started: true, path: outputPath });
}
1825
/**
 * Stops the current recording and returns whatever
 * `browser.stopRecording()` resolves to as the response data.
 *
 * @param {object} command - Reads `id`.
 * @param {object} browser - Must provide `stopRecording()`.
 * @returns {Promise<object>} `successResponse` wrapping the stop result.
 */
async function handleRecordingStop(command, browser) {
    const stopOutcome = await browser.stopRecording();
    const { id } = command;
    return successResponse(id, stopOutcome);
}
1829
/**
 * Restarts recording through `browser.restartRecording` and reports both the
 * new recording path and what that call returned about the previous one.
 *
 * @param {object} command - Reads `id`, `path` and `url`.
 * @param {object} browser - Must provide `restartRecording()`.
 * @returns {Promise<object>} `successResponse` payload
 *   `{ started: true, path, previousPath, stopped }`.
 */
async function handleRecordingRestart(command, browser) {
    const restartOutcome = await browser.restartRecording(command.path, command.url);
    const payload = {
        started: true,
        path: command.path,
        previousPath: restartOutcome.previousPath,
        stopped: restartOutcome.stopped,
    };
    return successResponse(command.id, payload);
}
1838
+ // Diff handlers
1839
/**
 * Diffs a fresh page snapshot against a baseline.
 *
 * The baseline is read from the file at `command.baseline` when given,
 * otherwise it is the last snapshot remembered by the browser. After the
 * diff is computed, the fresh snapshot becomes the browser's last snapshot.
 *
 * @param {object} command - Reads `id`, `baseline`, `selector`, `compact`
 *   and `maxDepth`.
 * @param {object} browser - Must provide `getLastSnapshot()`, `getPage()`
 *   and `setLastSnapshot()`.
 * @returns {Promise<object>} `successResponse` wrapping the diff, or an
 *   `errorResponse` when the baseline file cannot be read or no previous
 *   snapshot exists.
 */
async function handleDiffSnapshot(command, browser) {
    const { id, baseline } = command;
    let previous;
    if (!baseline) {
        previous = browser.getLastSnapshot();
        if (!previous) {
            return errorResponse(id, 'No previous snapshot in this session. Take a snapshot first, or use --baseline <file>.');
        }
    }
    else {
        try {
            previous = fs.readFileSync(baseline, 'utf-8');
        }
        catch {
            return errorResponse(id, `Cannot read baseline file: ${baseline}`);
        }
    }
    const activePage = browser.getPage();
    const snapshotOptions = {
        selector: command.selector,
        compact: command.compact,
        maxDepth: command.maxDepth,
    };
    const snapshot = await getEnhancedSnapshot(activePage, snapshotOptions);
    // An empty tree is represented by a fixed placeholder string
    const current = snapshot.tree || 'Empty page';
    const diff = diffSnapshots(previous, current);
    browser.setLastSnapshot(current);
    return successResponse(id, diff);
}
1866
/**
 * Takes a PNG screenshot (of one element when `command.selector` is given,
 * otherwise of the page) and diffs it against the baseline image file.
 *
 * The baseline is treated as JPEG when its extension is `.jpg` or `.jpeg`
 * (case-insensitive) and as PNG otherwise.
 *
 * @param {object} command - Reads `id`, `baseline`, `selector`, `fullPage`,
 *   `threshold` and `output`.
 * @param {object} browser - Must provide `getPage()` and
 *   `getLocatorFromRef()`.
 * @returns {Promise<object>} `successResponse` wrapping the diff result, or
 *   an `errorResponse` when the baseline file does not exist.
 */
async function handleDiffScreenshot(command, browser) {
    const { baseline, selector } = command;
    if (!fs.existsSync(baseline)) {
        return errorResponse(command.id, `Baseline file not found: ${baseline}`);
    }
    const activePage = browser.getPage();
    let currentShot;
    if (!selector) {
        currentShot = await activePage.screenshot({ fullPage: command.fullPage, type: 'png' });
    }
    else {
        // Prefer a ref-based locator; fall back to treating the value as a selector
        const target = browser.getLocatorFromRef(selector) || activePage.locator(selector);
        currentShot = await target.screenshot({ type: 'png' });
    }
    const baselineBytes = fs.readFileSync(baseline);
    const extension = path.extname(baseline).toLowerCase();
    const isJpeg = ['.jpg', '.jpeg'].includes(extension);
    const baselineMime = isJpeg ? 'image/jpeg' : 'image/png';
    const diffOptions = {
        threshold: command.threshold,
        outputPath: command.output,
        baselineMime,
    };
    const diff = await diffScreenshots(activePage.context(), baselineBytes, currentShot, diffOptions);
    return successResponse(command.id, diff);
}
1889
/**
 * Navigates the page to `command.url1` and then `command.url2`, snapshots
 * each, and returns the snapshot diff. When `command.screenshot` is set, a
 * screenshot diff of the two pages is included as well.
 *
 * Navigation waits for `command.waitUntil`, defaulting to 'load'.
 *
 * @param {object} command - Reads `id`, `url1`, `url2`, `waitUntil`,
 *   `selector`, `compact`, `maxDepth`, `screenshot` and `fullPage`.
 * @param {object} browser - Must provide `getPage()`.
 * @returns {Promise<object>} `successResponse` payload `{ snapshot }`, plus
 *   `screenshot` when a screenshot diff was produced.
 */
async function handleDiffUrl(command, browser) {
    const activePage = browser.getPage();
    const waitUntil = command.waitUntil ?? 'load';
    const snapshotOpts = {
        selector: command.selector,
        compact: command.compact,
        maxDepth: command.maxDepth,
    };
    // Navigate to a URL and return its snapshot text
    const visitAndSnapshot = async (url) => {
        await activePage.goto(url, { waitUntil });
        const { tree } = await getEnhancedSnapshot(activePage, snapshotOpts);
        return tree || 'Empty page';
    };
    const takePng = () => activePage.screenshot({ fullPage: command.fullPage, type: 'png' });
    // State of url1 (the screenshot must be taken before leaving the page)
    const firstSnapshot = await visitAndSnapshot(command.url1);
    let firstShot;
    if (command.screenshot) {
        firstShot = await takePng();
    }
    // State of url2
    const secondSnapshot = await visitAndSnapshot(command.url2);
    const result = { snapshot: diffSnapshots(firstSnapshot, secondSnapshot) };
    if (command.screenshot && firstShot) {
        const secondShot = await takePng();
        result.screenshot = await diffScreenshots(activePage.context(), firstShot, secondShot, {});
    }
    return successResponse(command.id, result);
}
1917
+ //# sourceMappingURL=actions.js.map