nstbrowser-ai-agent 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (119) hide show
  1. package/LICENSE +201 -0
  2. package/README.md +1321 -0
  3. package/bin/nstbrowser-ai-agent-darwin-arm64 +0 -0
  4. package/bin/nstbrowser-ai-agent-darwin-x64 +0 -0
  5. package/bin/nstbrowser-ai-agent-linux-arm64 +0 -0
  6. package/bin/nstbrowser-ai-agent-linux-x64 +0 -0
  7. package/bin/nstbrowser-ai-agent-win32-x64.exe +0 -0
  8. package/bin/nstbrowser-ai-agent.js +109 -0
  9. package/dist/action-policy.d.ts +14 -0
  10. package/dist/action-policy.d.ts.map +1 -0
  11. package/dist/action-policy.js +253 -0
  12. package/dist/action-policy.js.map +1 -0
  13. package/dist/actions.d.ts +18 -0
  14. package/dist/actions.d.ts.map +1 -0
  15. package/dist/actions.js +2037 -0
  16. package/dist/actions.js.map +1 -0
  17. package/dist/auth-cli.d.ts +2 -0
  18. package/dist/auth-cli.d.ts.map +1 -0
  19. package/dist/auth-cli.js +97 -0
  20. package/dist/auth-cli.js.map +1 -0
  21. package/dist/auth-vault.d.ts +36 -0
  22. package/dist/auth-vault.d.ts.map +1 -0
  23. package/dist/auth-vault.js +125 -0
  24. package/dist/auth-vault.js.map +1 -0
  25. package/dist/browser.d.ts +573 -0
  26. package/dist/browser.d.ts.map +1 -0
  27. package/dist/browser.js +2036 -0
  28. package/dist/browser.js.map +1 -0
  29. package/dist/confirmation.d.ts +8 -0
  30. package/dist/confirmation.d.ts.map +1 -0
  31. package/dist/confirmation.js +30 -0
  32. package/dist/confirmation.js.map +1 -0
  33. package/dist/daemon.d.ts +65 -0
  34. package/dist/daemon.d.ts.map +1 -0
  35. package/dist/daemon.js +589 -0
  36. package/dist/daemon.js.map +1 -0
  37. package/dist/diff.d.ts +18 -0
  38. package/dist/diff.d.ts.map +1 -0
  39. package/dist/diff.js +271 -0
  40. package/dist/diff.js.map +1 -0
  41. package/dist/domain-filter.d.ts +28 -0
  42. package/dist/domain-filter.d.ts.map +1 -0
  43. package/dist/domain-filter.js +149 -0
  44. package/dist/domain-filter.js.map +1 -0
  45. package/dist/encryption.d.ts +73 -0
  46. package/dist/encryption.d.ts.map +1 -0
  47. package/dist/encryption.js +171 -0
  48. package/dist/encryption.js.map +1 -0
  49. package/dist/ios-actions.d.ts +11 -0
  50. package/dist/ios-actions.d.ts.map +1 -0
  51. package/dist/ios-actions.js +228 -0
  52. package/dist/ios-actions.js.map +1 -0
  53. package/dist/ios-manager.d.ts +266 -0
  54. package/dist/ios-manager.d.ts.map +1 -0
  55. package/dist/ios-manager.js +1073 -0
  56. package/dist/ios-manager.js.map +1 -0
  57. package/dist/nstbrowser-actions.d.ts +10 -0
  58. package/dist/nstbrowser-actions.d.ts.map +1 -0
  59. package/dist/nstbrowser-actions.js +277 -0
  60. package/dist/nstbrowser-actions.js.map +1 -0
  61. package/dist/nstbrowser-client.d.ts +197 -0
  62. package/dist/nstbrowser-client.d.ts.map +1 -0
  63. package/dist/nstbrowser-client.js +454 -0
  64. package/dist/nstbrowser-client.js.map +1 -0
  65. package/dist/nstbrowser-errors.d.ts +28 -0
  66. package/dist/nstbrowser-errors.d.ts.map +1 -0
  67. package/dist/nstbrowser-errors.js +59 -0
  68. package/dist/nstbrowser-errors.js.map +1 -0
  69. package/dist/nstbrowser-profile-resolver.d.ts +89 -0
  70. package/dist/nstbrowser-profile-resolver.d.ts.map +1 -0
  71. package/dist/nstbrowser-profile-resolver.js +227 -0
  72. package/dist/nstbrowser-profile-resolver.js.map +1 -0
  73. package/dist/nstbrowser-types.d.ts +151 -0
  74. package/dist/nstbrowser-types.d.ts.map +1 -0
  75. package/dist/nstbrowser-types.js +5 -0
  76. package/dist/nstbrowser-types.js.map +1 -0
  77. package/dist/nstbrowser-utils.d.ts +71 -0
  78. package/dist/nstbrowser-utils.d.ts.map +1 -0
  79. package/dist/nstbrowser-utils.js +174 -0
  80. package/dist/nstbrowser-utils.js.map +1 -0
  81. package/dist/protocol.d.ts +26 -0
  82. package/dist/protocol.d.ts.map +1 -0
  83. package/dist/protocol.js +1245 -0
  84. package/dist/protocol.js.map +1 -0
  85. package/dist/snapshot.d.ts +67 -0
  86. package/dist/snapshot.d.ts.map +1 -0
  87. package/dist/snapshot.js +514 -0
  88. package/dist/snapshot.js.map +1 -0
  89. package/dist/state-utils.d.ts +77 -0
  90. package/dist/state-utils.d.ts.map +1 -0
  91. package/dist/state-utils.js +178 -0
  92. package/dist/state-utils.js.map +1 -0
  93. package/dist/stream-server.d.ts +117 -0
  94. package/dist/stream-server.d.ts.map +1 -0
  95. package/dist/stream-server.js +309 -0
  96. package/dist/stream-server.js.map +1 -0
  97. package/dist/types.d.ts +1121 -0
  98. package/dist/types.d.ts.map +1 -0
  99. package/dist/types.js +2 -0
  100. package/dist/types.js.map +1 -0
  101. package/package.json +83 -0
  102. package/scripts/analyze-api-coverage.js +205 -0
  103. package/scripts/analyze-cli-coverage.js +239 -0
  104. package/scripts/build-all-platforms.sh +68 -0
  105. package/scripts/check-version-sync.js +39 -0
  106. package/scripts/copy-native.js +36 -0
  107. package/scripts/download-nstbrowser-docs.js +152 -0
  108. package/scripts/generate-skills.sh +218 -0
  109. package/scripts/postinstall.js +231 -0
  110. package/scripts/sync-version.js +69 -0
  111. package/skills/nstbrowser-ai-agent/SKILL.md +759 -0
  112. package/skills/nstbrowser-ai-agent/references/batch-operations.md +414 -0
  113. package/skills/nstbrowser-ai-agent/references/nst-api-reference.md +960 -0
  114. package/skills/nstbrowser-ai-agent/references/profile-management.md +672 -0
  115. package/skills/nstbrowser-ai-agent/references/proxy-configuration.md +460 -0
  116. package/skills/nstbrowser-ai-agent/references/troubleshooting.md +773 -0
  117. package/skills/nstbrowser-ai-agent/templates/automated-workflow.sh +248 -0
  118. package/skills/nstbrowser-ai-agent/templates/batch-proxy-update.sh +257 -0
  119. package/skills/nstbrowser-ai-agent/templates/profile-setup.sh +248 -0
@@ -0,0 +1,2037 @@
1
+ import * as fs from 'fs';
2
+ import * as path from 'path';
3
+ import { mkdirSync } from 'node:fs';
4
+ import { getAppDir } from './daemon.js';
5
+ import { checkPolicy, describeAction, getActionCategory, loadPolicyFile, initPolicyReloader, reloadPolicyIfChanged, } from './action-policy.js';
6
+ import { requestConfirmation, getAndRemovePending } from './confirmation.js';
7
+ import { getAuthProfile, updateLastLogin } from './auth-vault.js';
8
+ import { getSessionsDir, readStateFile, isValidSessionName, isEncryptedPayload, listStateFiles, cleanupExpiredStates, } from './state-utils.js';
9
+ import { successResponse, errorResponse, parseCommand } from './protocol.js';
10
+ import { diffSnapshots, diffScreenshots } from './diff.js';
11
+ import { getEnhancedSnapshot } from './snapshot.js';
12
// Sink for screencast frames. It starts out as null and is replaced through
// setScreencastFrameCallback() (by the daemon, once streaming is active).
let screencastFrameCallback = null;

/**
 * Register the callback that screencast frames are forwarded to.
 *
 * The daemon calls this to set up frame streaming. The value is stored as-is;
 * no validation is performed here.
 *
 * @param {*} callback - Value stored as the module-level frame callback.
 * @returns {void}
 */
export function setScreencastFrameCallback(callback) {
    screencastFrameCallback = callback;
}
21
/**
 * Translate a Playwright error into a message an AI agent can act on.
 *
 * The checks run in a fixed order and the first match wins:
 *   1. strict mode violation (selector matched several elements)
 *   2. pointer events intercepted (overlay / modal in the way)
 *   3. "not visible" without a timeout
 *   4. "Timeout ... exceeded"
 *   5. "waiting for" combined with "to be visible" or "Timeout"
 * Anything else is returned unchanged (wrapped in an Error if it was not one).
 *
 * @internal Exported for testing
 * @param {unknown} error - The thrown value.
 * @param {string} selector - Selector or ref the failing action targeted; only used in the message text.
 * @returns {Error} A rewritten error, or the original error for unrecognised messages.
 */
export function toAIFriendlyError(error, selector) {
    const message = error instanceof Error ? error.message : String(error);
    const mentions = (fragment) => message.includes(fragment);

    // Several elements matched: report how many when Playwright tells us.
    if (mentions('strict mode violation')) {
        const count = message.match(/resolved to (\d+) elements/)?.[1] ?? 'multiple';
        return new Error(`Selector "${selector}" matched ${count} elements. Run 'snapshot' to get updated refs, or use a more specific CSS selector.`);
    }

    // Must be tested before the timeout branch: a blocked element also
    // surfaces as a timeout, but the overlay hint is the more useful one.
    if (mentions('intercepts pointer events')) {
        return new Error(`Element "${selector}" is blocked by another element (likely a modal or overlay). Try dismissing any modals/cookie banners first.`);
    }

    const hasTimeout = mentions('Timeout');

    // Plain visibility failure (not one produced by a timeout).
    if (mentions('not visible') && !hasTimeout) {
        return new Error(`Element "${selector}" is not visible. Try scrolling it into view or check if it's hidden.`);
    }

    // Generic timeout: the action could not complete in time.
    if (hasTimeout && mentions('exceeded')) {
        return new Error(`Action on "${selector}" timed out. The element may be blocked, still loading, or not interactable. Run 'snapshot' to check the current page state.`);
    }

    // Waiting for an element that never showed up.
    if (mentions('waiting for') && (mentions('to be visible') || hasTimeout)) {
        return new Error(`Element "${selector}" not found or not visible. Run 'snapshot' to see current page elements.`);
    }

    // Unknown shape: hand back the original error object when there is one.
    if (error instanceof Error) {
        return error;
    }
    return new Error(message);
}
60
// Currently loaded action policy (null until a policy file has been loaded).
let actionPolicy = null;
// Lower-cased category names taken from NSTBROWSER_AI_AGENT_CONFIRM_ACTIONS.
let confirmCategories = new Set();

/**
 * Initialise policy state from the environment.
 *
 * - NSTBROWSER_AI_AGENT_ACTION_POLICY: path of a policy file. When set, the
 *   file is loaded and handed to the policy reloader. A load failure is logged
 *   and terminates the process with exit code 1.
 * - NSTBROWSER_AI_AGENT_CONFIRM_ACTIONS: comma-separated category names.
 *   Entries are trimmed and lower-cased, and empty entries are dropped.
 *
 * @returns {void}
 */
export function initActionPolicy() {
    const policyPath = process.env.NSTBROWSER_AI_AGENT_ACTION_POLICY;
    if (policyPath) {
        try {
            actionPolicy = loadPolicyFile(policyPath);
            initPolicyReloader(policyPath, actionPolicy);
        }
        catch (err) {
            const reason = err instanceof Error ? err.message : err;
            console.error(`[ERROR] Failed to load action policy from ${policyPath}: ${reason}`);
            process.exit(1);
        }
    }

    const confirmActionsEnv = process.env.NSTBROWSER_AI_AGENT_CONFIRM_ACTIONS;
    if (!confirmActionsEnv) {
        return;
    }
    const categories = [];
    for (const rawEntry of confirmActionsEnv.split(',')) {
        const category = rawEntry.trim().toLowerCase();
        if (category.length > 0) {
            categories.push(category);
        }
    }
    confirmCategories = new Set(categories);
}
82
/**
 * Execute a command and return a response.
 *
 * Flow:
 *   1. `confirm` / `deny` are routed straight to their handlers and bypass the
 *      policy check.
 *   2. The policy is refreshed via reloadPolicyIfChanged() and the action is
 *      checked against it.
 *   3. A `deny` decision yields an error response; a `confirm` decision
 *      registers a pending confirmation and reports its id instead of running
 *      the action; any other decision dispatches the action.
 *
 * Errors thrown (and awaited) inside the try block are converted into an
 * error response carrying the error message.
 *
 * @param {object} command - Parsed command; `action` and `id` are read here.
 * @param {object} browser - Browser manager forwarded to the handlers.
 * @returns {Promise<object>} The response object built by the protocol helpers.
 */
export async function executeCommand(command, browser) {
    try {
        // Confirmation replies are never subject to policy.
        switch (command.action) {
            case 'confirm':
                return await handleConfirm(command, browser);
            case 'deny':
                return handleDeny(command);
            default:
                break;
        }

        // Hot-reload the policy file if it changed on disk.
        actionPolicy = reloadPolicyIfChanged();

        const verdict = checkPolicy(command.action, actionPolicy, confirmCategories);
        if (verdict !== 'deny' && verdict !== 'confirm') {
            return await dispatchAction(command, browser);
        }

        const category = getActionCategory(command.action);
        if (verdict === 'deny') {
            return errorResponse(command.id, `Action denied by policy: '${category}' is not allowed`);
        }

        // verdict === 'confirm': park the command until it is confirmed or denied.
        const description = describeAction(command.action, command);
        const { confirmationId } = requestConfirmation(command.action, category, description, command);
        return successResponse(command.id, {
            confirmation_required: true,
            action: command.action,
            category,
            description,
            confirmation_id: confirmationId,
        });
    }
    catch (error) {
        const message = error instanceof Error ? error.message : String(error);
        return errorResponse(command.id, message);
    }
}
121
// Action name -> handler invocation. Each entry is a thunk so the handler
// identifier is only resolved when that action is actually dispatched.
// The state_list / state_clear / state_show / state_clean / state_rename
// handlers are invoked with the command only.
const ACTION_DISPATCH_TABLE = new Map([
    ['launch', (c, b) => handleLaunch(c, b)],
    ['navigate', (c, b) => handleNavigate(c, b)],
    ['click', (c, b) => handleClick(c, b)],
    ['type', (c, b) => handleType(c, b)],
    ['fill', (c, b) => handleFill(c, b)],
    ['check', (c, b) => handleCheck(c, b)],
    ['uncheck', (c, b) => handleUncheck(c, b)],
    ['upload', (c, b) => handleUpload(c, b)],
    ['dblclick', (c, b) => handleDoubleClick(c, b)],
    ['focus', (c, b) => handleFocus(c, b)],
    ['drag', (c, b) => handleDrag(c, b)],
    ['frame', (c, b) => handleFrame(c, b)],
    ['mainframe', (c, b) => handleMainFrame(c, b)],
    ['getbyrole', (c, b) => handleGetByRole(c, b)],
    ['getbytext', (c, b) => handleGetByText(c, b)],
    ['getbylabel', (c, b) => handleGetByLabel(c, b)],
    ['getbyplaceholder', (c, b) => handleGetByPlaceholder(c, b)],
    ['press', (c, b) => handlePress(c, b)],
    ['screenshot', (c, b) => handleScreenshot(c, b)],
    ['snapshot', (c, b) => handleSnapshot(c, b)],
    ['evaluate', (c, b) => handleEvaluate(c, b)],
    ['wait', (c, b) => handleWait(c, b)],
    ['scroll', (c, b) => handleScroll(c, b)],
    ['select', (c, b) => handleSelect(c, b)],
    ['hover', (c, b) => handleHover(c, b)],
    ['content', (c, b) => handleContent(c, b)],
    ['close', (c, b) => handleClose(c, b)],
    ['tab_new', (c, b) => handleTabNew(c, b)],
    ['tab_list', (c, b) => handleTabList(c, b)],
    ['tab_switch', (c, b) => handleTabSwitch(c, b)],
    ['tab_close', (c, b) => handleTabClose(c, b)],
    ['window_new', (c, b) => handleWindowNew(c, b)],
    ['cookies_get', (c, b) => handleCookiesGet(c, b)],
    ['cookies_set', (c, b) => handleCookiesSet(c, b)],
    ['cookies_clear', (c, b) => handleCookiesClear(c, b)],
    ['storage_get', (c, b) => handleStorageGet(c, b)],
    ['storage_set', (c, b) => handleStorageSet(c, b)],
    ['storage_clear', (c, b) => handleStorageClear(c, b)],
    ['dialog', (c, b) => handleDialog(c, b)],
    ['pdf', (c, b) => handlePdf(c, b)],
    ['route', (c, b) => handleRoute(c, b)],
    ['unroute', (c, b) => handleUnroute(c, b)],
    ['requests', (c, b) => handleRequests(c, b)],
    ['download', (c, b) => handleDownload(c, b)],
    ['geolocation', (c, b) => handleGeolocation(c, b)],
    ['permissions', (c, b) => handlePermissions(c, b)],
    ['viewport', (c, b) => handleViewport(c, b)],
    ['useragent', (c, b) => handleUserAgent(c, b)],
    ['device', (c, b) => handleDevice(c, b)],
    ['back', (c, b) => handleBack(c, b)],
    ['forward', (c, b) => handleForward(c, b)],
    ['reload', (c, b) => handleReload(c, b)],
    ['url', (c, b) => handleUrl(c, b)],
    ['title', (c, b) => handleTitle(c, b)],
    ['getattribute', (c, b) => handleGetAttribute(c, b)],
    ['gettext', (c, b) => handleGetText(c, b)],
    ['isvisible', (c, b) => handleIsVisible(c, b)],
    ['isenabled', (c, b) => handleIsEnabled(c, b)],
    ['ischecked', (c, b) => handleIsChecked(c, b)],
    ['count', (c, b) => handleCount(c, b)],
    ['boundingbox', (c, b) => handleBoundingBox(c, b)],
    ['styles', (c, b) => handleStyles(c, b)],
    ['video_start', (c, b) => handleVideoStart(c, b)],
    ['video_stop', (c, b) => handleVideoStop(c, b)],
    ['trace_start', (c, b) => handleTraceStart(c, b)],
    ['trace_stop', (c, b) => handleTraceStop(c, b)],
    ['profiler_start', (c, b) => handleProfilerStart(c, b)],
    ['profiler_stop', (c, b) => handleProfilerStop(c, b)],
    ['har_start', (c, b) => handleHarStart(c, b)],
    ['har_stop', (c, b) => handleHarStop(c, b)],
    ['state_save', (c, b) => handleStateSave(c, b)],
    ['state_load', (c, b) => handleStateLoad(c, b)],
    ['state_list', (c) => handleStateList(c)],
    ['state_clear', (c) => handleStateClear(c)],
    ['state_show', (c) => handleStateShow(c)],
    ['state_clean', (c) => handleStateClean(c)],
    ['state_rename', (c) => handleStateRename(c)],
    ['console', (c, b) => handleConsole(c, b)],
    ['errors', (c, b) => handleErrors(c, b)],
    ['keyboard', (c, b) => handleKeyboard(c, b)],
    ['wheel', (c, b) => handleWheel(c, b)],
    ['tap', (c, b) => handleTap(c, b)],
    ['clipboard', (c, b) => handleClipboard(c, b)],
    ['highlight', (c, b) => handleHighlight(c, b)],
    ['clear', (c, b) => handleClear(c, b)],
    ['selectall', (c, b) => handleSelectAll(c, b)],
    ['innertext', (c, b) => handleInnerText(c, b)],
    ['innerhtml', (c, b) => handleInnerHtml(c, b)],
    ['inputvalue', (c, b) => handleInputValue(c, b)],
    ['setvalue', (c, b) => handleSetValue(c, b)],
    ['dispatch', (c, b) => handleDispatch(c, b)],
    ['evalhandle', (c, b) => handleEvalHandle(c, b)],
    ['expose', (c, b) => handleExpose(c, b)],
    ['addscript', (c, b) => handleAddScript(c, b)],
    ['addstyle', (c, b) => handleAddStyle(c, b)],
    ['emulatemedia', (c, b) => handleEmulateMedia(c, b)],
    ['offline', (c, b) => handleOffline(c, b)],
    ['headers', (c, b) => handleHeaders(c, b)],
    ['pause', (c, b) => handlePause(c, b)],
    ['getbyalttext', (c, b) => handleGetByAltText(c, b)],
    ['getbytitle', (c, b) => handleGetByTitle(c, b)],
    ['getbytestid', (c, b) => handleGetByTestId(c, b)],
    ['nth', (c, b) => handleNth(c, b)],
    ['waitforurl', (c, b) => handleWaitForUrl(c, b)],
    ['waitforloadstate', (c, b) => handleWaitForLoadState(c, b)],
    ['setcontent', (c, b) => handleSetContent(c, b)],
    ['timezone', (c, b) => handleTimezone(c, b)],
    ['locale', (c, b) => handleLocale(c, b)],
    ['credentials', (c, b) => handleCredentials(c, b)],
    ['mousemove', (c, b) => handleMouseMove(c, b)],
    ['mousedown', (c, b) => handleMouseDown(c, b)],
    ['mouseup', (c, b) => handleMouseUp(c, b)],
    ['bringtofront', (c, b) => handleBringToFront(c, b)],
    ['waitforfunction', (c, b) => handleWaitForFunction(c, b)],
    ['scrollintoview', (c, b) => handleScrollIntoView(c, b)],
    ['addinitscript', (c, b) => handleAddInitScript(c, b)],
    ['keydown', (c, b) => handleKeyDown(c, b)],
    ['keyup', (c, b) => handleKeyUp(c, b)],
    ['inserttext', (c, b) => handleInsertText(c, b)],
    ['multiselect', (c, b) => handleMultiSelect(c, b)],
    ['waitfordownload', (c, b) => handleWaitForDownload(c, b)],
    ['responsebody', (c, b) => handleResponseBody(c, b)],
    ['screencast_start', (c, b) => handleScreencastStart(c, b)],
    ['screencast_stop', (c, b) => handleScreencastStop(c, b)],
    ['input_mouse', (c, b) => handleInputMouse(c, b)],
    ['input_keyboard', (c, b) => handleInputKeyboard(c, b)],
    ['input_touch', (c, b) => handleInputTouch(c, b)],
    ['recording_start', (c, b) => handleRecordingStart(c, b)],
    ['recording_stop', (c, b) => handleRecordingStop(c, b)],
    ['recording_restart', (c, b) => handleRecordingRestart(c, b)],
    ['diff_snapshot', (c, b) => handleDiffSnapshot(c, b)],
    ['diff_screenshot', (c, b) => handleDiffScreenshot(c, b)],
    ['diff_url', (c, b) => handleDiffUrl(c, b)],
    ['auth_login', (c, b) => handleAuthLogin(c, b)],
]);

/**
 * Dispatch a command to its handler after policy checks have passed.
 *
 * @param {object} command - Command whose `action` selects the handler.
 * @param {object} browser - Browser manager forwarded to the handler.
 * @returns {Promise<object>} The handler's response, or an error response
 *   ("Unknown action: ...") when no handler is registered for the action.
 */
async function dispatchAction(command, browser) {
    const invoke = ACTION_DISPATCH_TABLE.get(command.action);
    if (invoke === undefined) {
        // Should not happen for well-typed commands, but handled for safety.
        const unknownCommand = command;
        return errorResponse(unknownCommand.id, `Unknown action: ${unknownCommand.action}`);
    }
    return await invoke(command, browser);
}
401
/**
 * Launch the browser, passing the whole command through as launch options.
 *
 * @param {object} command - Launch command; forwarded unchanged to `browser.launch`.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with `{ launched: true }`.
 */
async function handleLaunch(command, browser) {
    await browser.launch(command);
    const payload = { launched: true };
    return successResponse(command.id, payload);
}
405
/**
 * Navigate the current page to `command.url`.
 *
 * The URL is first passed to `browser.checkDomainAllowed`. When the command
 * carries a non-empty `headers` object, those headers are registered as
 * scoped headers for the URL before navigating.
 *
 * @param {object} command - Reads `url`, optional `headers`, optional `waitUntil` (defaults to 'load').
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with the resulting `url` and `title`.
 */
async function handleNavigate(command, browser) {
    const { url: destination, headers, waitUntil } = command;

    browser.checkDomainAllowed(destination);
    const page = browser.getPage();

    // Only register scoped headers when at least one header was supplied.
    const hasHeaders = Boolean(headers) && Object.keys(headers).length > 0;
    if (hasHeaders) {
        await browser.setScopedHeaders(destination, headers);
    }

    await page.goto(destination, { waitUntil: waitUntil ?? 'load' });

    const url = page.url();
    const title = await page.title();
    return successResponse(command.id, { url, title });
}
420
/**
 * Click an element, or (with `command.newTab`) open a link's target in a new tab.
 *
 * The selector is resolved through `browser.getLocator`, so both refs (@e1)
 * and regular selectors are accepted.
 *
 * New-tab mode: the element's `href` is resolved against the document base
 * URI inside the page, checked with `browser.checkDomainAllowed` (the same
 * gate `navigate` uses), and only then opened in a freshly created tab.
 *
 * @param {object} command - Reads `selector`, `newTab`, `button`, `clickCount`, `delay`.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response: `{ clicked: true }`, plus
 *   `newTab: true` and `url` in new-tab mode.
 * @throws {Error} The failure passed through `toAIFriendlyError`, including a
 *   missing `href` in new-tab mode or a URL rejected by the domain check.
 */
async function handleClick(command, browser) {
    // Support both refs (@e1) and regular selectors
    const locator = browser.getLocator(command.selector);
    try {
        if (!command.newTab) {
            await locator.click({
                button: command.button,
                clickCount: command.clickCount,
                delay: command.delay,
            });
            return successResponse(command.id, { clicked: true });
        }

        // --new-tab: resolve the link target inside the page so relative
        // hrefs are expanded against document.baseURI.
        const fullUrl = await locator.evaluate((el) => {
            const href = el.getAttribute('href');
            // URL and document.baseURI are available in the browser context
            return href
                ? new globalThis.URL(href, globalThis.document.baseURI).toString()
                : '';
        });
        if (!fullUrl) {
            throw new Error(`Element '${command.selector}' does not have an href attribute. --new-tab only works on links.`);
        }

        // Apply the same domain gate as handleNavigate *before* creating the
        // tab, so a rejected link neither navigates nor leaves a stray tab.
        browser.checkDomainAllowed(fullUrl);

        await browser.newTab();
        const newPage = browser.getPage();
        await newPage.goto(fullUrl);
        return successResponse(command.id, {
            clicked: true,
            newTab: true,
            url: fullUrl,
        });
    }
    catch (error) {
        throw toAIFriendlyError(error, command.selector);
    }
}
456
/**
 * Type text into an element one key at a time.
 *
 * When `command.clear` is truthy the field is emptied (filled with '') before
 * typing starts.
 *
 * @param {object} command - Reads `selector`, `text`, optional `clear` and `delay`.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with `{ typed: true }`.
 * @throws {Error} Any locator failure, passed through `toAIFriendlyError`.
 */
async function handleType(command, browser) {
    const field = browser.getLocator(command.selector);
    const typingOptions = () => ({ delay: command.delay });
    try {
        if (command.clear) {
            await field.fill('');
        }
        await field.pressSequentially(command.text, typingOptions());
    }
    catch (error) {
        throw toAIFriendlyError(error, command.selector);
    }
    const payload = { typed: true };
    return successResponse(command.id, payload);
}
471
/**
 * Press a key, either on a specific element or on the page's keyboard.
 *
 * With a selector the key goes through `page.press(selector, key)`; without
 * one it goes through `page.keyboard.press(key)`.
 *
 * @param {object} command - Reads `key` and optional `selector`.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with `{ pressed: true }`.
 */
async function handlePress(command, browser) {
    const page = browser.getPage();
    const pressing = command.selector
        ? page.press(command.selector, command.key)
        : page.keyboard.press(command.key);
    await pressing;
    return successResponse(command.id, { pressed: true });
}
481
// DOM id of the temporary element that holds screenshot annotation labels.
const ANNOTATION_OVERLAY_ID = '__agent_browser_annotations__';

/**
 * Remove the annotation overlay element from the page, if it exists.
 *
 * Best effort: a rejected evaluation is deliberately ignored, so this never
 * rejects because of an in-page failure.
 *
 * @param {object} page - Object exposing `evaluate(script)` that returns a promise.
 * @returns {Promise<void>}
 */
async function removeAnnotationOverlay(page) {
    const overlayId = JSON.stringify(ANNOTATION_OVERLAY_ID);
    const script = `(() => { const el = document.getElementById(${overlayId}); if (el) el.remove(); })()`;
    const ignoreFailure = () => { };
    await page.evaluate(script).catch(ignoreFailure);
}
487
/** Round a bounding box's position and size to whole pixels. */
function roundedRect(rect) {
    return {
        x: Math.round(rect.x),
        y: Math.round(rect.y),
        width: Math.round(rect.width),
        height: Math.round(rect.height),
    };
}

/** Build a default screenshot path under <appDir>/tmp/screenshots, creating the directory. */
function defaultScreenshotPath(format) {
    const ext = format === 'jpeg' ? 'jpg' : 'png';
    const timestamp = new Date().toISOString().replace(/[:.]/g, '-');
    const random = Math.random().toString(36).substring(2, 8);
    const filename = `screenshot-${timestamp}-${random}.${ext}`;
    const screenshotDir = path.join(getAppDir(), 'tmp', 'screenshots');
    mkdirSync(screenshotDir, { recursive: true });
    return path.join(screenshotDir, filename);
}

/**
 * Measure every ref of an interactive snapshot.
 * Refs without a locator, without a box, with a zero-sized box, or whose
 * measurement throws are left out of the result.
 */
async function measureAnnotationRefs(browser) {
    const { refs } = await browser.getSnapshot({ interactive: true });
    const measured = await Promise.all(Object.entries(refs).map(async ([ref, data]) => {
        try {
            const locator = browser.getLocatorFromRef(ref);
            if (!locator) {
                return null;
            }
            const box = await locator.boundingBox();
            if (!box || box.width === 0 || box.height === 0) {
                return null;
            }
            return {
                ref,
                number: parseInt(ref.replace('e', ''), 10),
                role: data.role,
                name: data.name || undefined,
                box: roundedRect(box),
            };
        }
        catch {
            return null;
        }
    }));
    return measured.filter((entry) => entry !== null);
}

/** Inject the numbered red boxes for `items` into the page as a single overlay element. */
async function injectAnnotationOverlay(page, items) {
    const overlayData = items.map(({ number, box }) => ({
        number,
        x: box.x,
        y: box.y,
        width: box.width,
        height: box.height,
    }));
    // Uses position:absolute with document-relative coords (box + scroll offset)
    // so labels render correctly for viewport, fullPage and selector-scoped shots.
    await page.evaluate(`(() => {
        var items = ${JSON.stringify(overlayData)};
        var id = ${JSON.stringify(ANNOTATION_OVERLAY_ID)};
        var sx = window.scrollX || 0;
        var sy = window.scrollY || 0;
        var c = document.createElement('div');
        c.id = id;
        c.style.cssText = 'position:absolute;top:0;left:0;width:0;height:0;pointer-events:none;z-index:2147483647;';
        for (var i = 0; i < items.length; i++) {
            var it = items[i];
            var dx = it.x + sx;
            var dy = it.y + sy;
            var b = document.createElement('div');
            b.style.cssText = 'position:absolute;left:' + dx + 'px;top:' + dy + 'px;width:' + it.width + 'px;height:' + it.height + 'px;border:2px solid rgba(255,0,0,0.8);box-sizing:border-box;pointer-events:none;';
            var l = document.createElement('div');
            l.textContent = String(it.number);
            var labelTop = dy < 14 ? '2px' : '-14px';
            l.style.cssText = 'position:absolute;top:' + labelTop + ';left:-2px;background:rgba(255,0,0,0.9);color:#fff;font:bold 11px/14px monospace;padding:0 4px;border-radius:2px;white-space:nowrap;';
            b.appendChild(l);
            c.appendChild(b);
        }
        document.documentElement.appendChild(c);
    })()`);
}

/**
 * Take a screenshot of the page or of a single element, optionally annotated.
 *
 * - Target: the element for `command.selector` when given, otherwise the page.
 * - Output path: `command.path`, or a generated file under
 *   <appDir>/tmp/screenshots when no path is supplied.
 * - `command.annotate`: numbered boxes for the interactive snapshot refs are
 *   drawn into a temporary overlay, and the same refs are returned as
 *   `annotations` with image-relative boxes (relative to the target element
 *   for selector shots, scroll-adjusted for fullPage, unchanged otherwise).
 *   The overlay is removed again after the capture, on success and on failure.
 *
 * @param {object} command - Reads `fullPage`, `format`, `quality`, `selector`, `path`, `annotate`.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with `path` and, when non-empty, `annotations`.
 * @throws {Error} The failure; passed through `toAIFriendlyError` when a selector was given.
 */
async function handleScreenshot(command, browser) {
    const page = browser.getPage();
    const options = {
        fullPage: command.fullPage,
        type: command.format ?? 'png',
    };
    if (command.format === 'jpeg' && command.quality !== undefined) {
        options.quality = command.quality;
    }
    const target = command.selector ? browser.getLocator(command.selector) : page;

    let overlayInjected = false;
    try {
        const savePath = command.path || defaultScreenshotPath(command.format);

        let annotations;
        if (command.annotate) {
            const candidates = await measureAnnotationRefs(browser);

            // A selector shot is cropped to that element, so only annotations
            // overlapping it are kept (coordinates are shifted further below).
            let targetBox = null;
            if (command.selector) {
                const raw = await browser.getLocator(command.selector).boundingBox();
                if (raw) {
                    targetBox = roundedRect(raw);
                }
            }
            const overlapsTarget = ({ box }) => box.x < targetBox.x + targetBox.width &&
                box.x + box.width > targetBox.x &&
                box.y < targetBox.y + targetBox.height &&
                box.y + box.height > targetBox.y;
            const kept = targetBox ? candidates.filter(overlapsTarget) : candidates;
            const overlayItems = kept.sort((a, b) => a.number - b.number);

            // The overlay keeps the measured coordinates; only the returned
            // metadata is re-based onto the image origin.
            if (overlayItems.length > 0) {
                await injectAnnotationOverlay(page, overlayItems);
                overlayInjected = true;
            }

            const rebased = (item, x, y) => ({
                ...item,
                box: { x, y, width: item.box.width, height: item.box.height },
            });
            if (targetBox) {
                // Selector: relative to the target element.
                annotations = overlayItems.map((a) => rebased(a, a.box.x - targetBox.x, a.box.y - targetBox.y));
            }
            else if (command.fullPage) {
                // fullPage: add the scroll offset to match the full-page image origin.
                const scroll = (await page.evaluate(`({x: window.scrollX || 0, y: window.scrollY || 0})`));
                annotations = overlayItems.map((a) => rebased(a, a.box.x + scroll.x, a.box.y + scroll.y));
            }
            else {
                // Default: coordinates as measured.
                annotations = overlayItems;
            }
        }

        await target.screenshot({ ...options, path: savePath });
        if (overlayInjected) {
            await removeAnnotationOverlay(page);
        }

        const payload = { path: savePath };
        if (annotations && annotations.length > 0) {
            payload.annotations = annotations;
        }
        return successResponse(command.id, payload);
    }
    catch (error) {
        // Never leave the overlay behind, even when the capture failed.
        if (overlayInjected) {
            await removeAnnotationOverlay(page);
        }
        throw command.selector ? toAIFriendlyError(error, command.selector) : error;
    }
}
662
/**
 * Produce a snapshot of the page with element refs.
 *
 * The snapshot options (`interactive`, `cursor`, `maxDepth`, `compact`,
 * `selector`) are forwarded from the command. Each ref in the response is
 * reduced to its `role` and `name`.
 *
 * @param {object} command - Snapshot command carrying the optional filters above.
 * @param {object} browser - Browser manager.
 * @returns {Promise<object>} Success response with `snapshot` ('Empty page'
 *   when the tree is empty), `refs` (undefined when there are none) and
 *   `origin` (the current page URL).
 */
async function handleSnapshot(command, browser) {
    const { interactive, cursor, maxDepth, compact, selector } = command;
    const { tree, refs } = await browser.getSnapshot({ interactive, cursor, maxDepth, compact, selector });

    // Keep only role and name per ref for the response.
    const simpleRefs = {};
    Object.entries(refs).forEach(([ref, data]) => {
        simpleRefs[ref] = { role: data.role, name: data.name };
    });
    const hasRefs = Object.keys(simpleRefs).length > 0;

    const page = browser.getPage();
    return successResponse(command.id, {
        snapshot: tree || 'Empty page',
        refs: hasRefs ? simpleRefs : undefined,
        origin: page.url(),
    });
}
683
/**
 * Evaluate `command.script` in the active page and return its result along
 * with the page URL (read after the evaluation finishes).
 *
 * @param command - reads `id` and `script`.
 * @param browser - must provide `getPage()`.
 */
async function handleEvaluate(command, browser) {
    const activePage = browser.getPage();
    // The script is handed to the page as-is (a string expression).
    const evaluated = await activePage.evaluate(command.script);
    const payload = { result: evaluated, origin: activePage.url() };
    return successResponse(command.id, payload);
}
689
/**
 * Wait for one of three things, in priority order:
 *   1. `command.selector` reaching `command.state` (default 'visible'),
 *   2. a plain delay of `command.timeout` (only when truthy),
 *   3. the page 'load' state.
 *
 * @param command - reads `id`, `selector`, `state`, `timeout`.
 * @param browser - must provide `getPage()`.
 */
async function handleWait(command, browser) {
    const page = browser.getPage();
    const { selector, timeout } = command;
    if (selector) {
        const waitOptions = { state: command.state ?? 'visible', timeout };
        await page.waitForSelector(selector, waitOptions);
    }
    else if (timeout) {
        await page.waitForTimeout(timeout);
    }
    else {
        // Nothing specific requested: fall back to the load state.
        await page.waitForLoadState('load');
    }
    return successResponse(command.id, { waited: true });
}
706
/**
 * Scroll the page, or a specific element, by a delta.
 *
 * The delta starts from `command.x` / `command.y` (default 0). When
 * `command.direction` is set, the matching axis is overwritten with
 * `command.amount` (default 100), negated for 'up' and 'left'.
 *
 * With `command.selector`, the element is first scrolled into view and then
 * scrolled by the delta if one was given explicitly or is non-zero. Without a
 * selector, the window is scrolled by the delta.
 *
 * The delta is passed to the page as an evaluate argument rather than being
 * interpolated into a script string, so a non-numeric `x`/`y` can never be
 * executed as code in the page.
 *
 * @param command - reads `id`, `x`, `y`, `direction`, `amount`, `selector`.
 * @param browser - must provide `getPage()` and `getLocator()`.
 * @returns the value produced by `successResponse` with `{ scrolled: true }`.
 */
async function handleScroll(command, browser) {
    const page = browser.getPage();
    let deltaX = command.x ?? 0;
    let deltaY = command.y ?? 0;
    const hasExplicitDelta = command.x !== undefined || command.y !== undefined;
    if (command.direction) {
        const amount = command.amount ?? 100;
        switch (command.direction) {
            case 'up':
                deltaY = -amount;
                break;
            case 'down':
                deltaY = amount;
                break;
            case 'left':
                deltaX = -amount;
                break;
            case 'right':
                deltaX = amount;
                break;
        }
    }
    const delta = { x: deltaX, y: deltaY };
    if (command.selector) {
        const element = browser.getLocator(command.selector);
        await element.scrollIntoViewIfNeeded();
        if (hasExplicitDelta || deltaX !== 0 || deltaY !== 0) {
            await element.evaluate((el, { x, y }) => {
                el.scrollBy(x, y);
            }, delta);
        }
    }
    else {
        // Runs in the page; values arrive as serialized data, not source text.
        await page.evaluate(({ x, y }) => {
            window.scrollBy(x, y);
        }, delta);
    }
    return successResponse(command.id, { scrolled: true });
}
742
/**
 * Select one or more option values on the element at `command.selector`.
 * A single value is wrapped into a one-element array first.
 *
 * @param command - reads `id`, `selector`, `values`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when `selectOption` fails.
 */
async function handleSelect(command, browser) {
    const target = browser.getLocator(command.selector);
    let values = command.values;
    if (!Array.isArray(values)) {
        values = [values];
    }
    try {
        await target.selectOption(values);
    }
    catch (failure) {
        throw toAIFriendlyError(failure, command.selector);
    }
    return successResponse(command.id, { selected: values });
}
753
/**
 * Hover over the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when the hover fails.
 */
async function handleHover(command, browser) {
    const { id, selector } = command;
    const target = browser.getLocator(selector);
    try {
        await target.hover();
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { hovered: true });
}
763
/**
 * Return HTML: the inner HTML of `command.selector` when given, otherwise the
 * full page content. The page URL is included as `origin`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleContent(command, browser) {
    const page = browser.getPage();
    const html = command.selector
        ? await page.locator(command.selector).innerHTML()
        : await page.content();
    return successResponse(command.id, { html, origin: page.url() });
}
774
/**
 * Close the browser and acknowledge with `{ closed: true }`.
 *
 * @param command - reads `id`.
 * @param browser - must provide `close()`.
 */
async function handleClose(command, browser) {
    await browser.close();
    const payload = { closed: true };
    return successResponse(command.id, payload);
}
778
/**
 * Open a new tab and, when `command.url` is set, navigate the current page to
 * it, waiting for 'domcontentloaded'.
 *
 * @param command - reads `id` and `url`.
 * @param browser - must provide `newTab()` and `getPage()`.
 * @returns `successResponse` carrying whatever `browser.newTab()` returned.
 */
async function handleTabNew(command, browser) {
    const created = await browser.newTab();
    const { url } = command;
    if (url) {
        await browser.getPage().goto(url, { waitUntil: 'domcontentloaded' });
    }
    return successResponse(command.id, created);
}
787
/**
 * List the open tabs together with the active tab index.
 *
 * @param command - reads `id`.
 * @param browser - must provide `listTabs()` and `getActiveIndex()`.
 */
async function handleTabList(command, browser) {
    const tabs = await browser.listTabs();
    const active = browser.getActiveIndex();
    return successResponse(command.id, { tabs, active });
}
794
/**
 * Switch to the tab at `command.index` and report the switch result plus the
 * title of the now-current page.
 *
 * @param command - reads `id` and `index`.
 * @param browser - must provide `switchTo()` and `getPage()`.
 */
async function handleTabSwitch(command, browser) {
    const switched = await browser.switchTo(command.index);
    const title = await browser.getPage().title();
    return successResponse(command.id, { ...switched, title });
}
802
/**
 * Close the tab at `command.index` and forward the result of `browser.closeTab`.
 *
 * @param command - reads `id` and `index`.
 * @param browser - must provide `closeTab()`.
 */
async function handleTabClose(command, browser) {
    const { id, index } = command;
    const outcome = await browser.closeTab(index);
    return successResponse(id, outcome);
}
806
/**
 * Open a new window, passing `command.viewport` through to `browser.newWindow`.
 *
 * @param command - reads `id` and `viewport`.
 * @param browser - must provide `newWindow()`.
 */
async function handleWindowNew(command, browser) {
    const { id, viewport } = command;
    const outcome = await browser.newWindow(viewport);
    return successResponse(id, outcome);
}
810
+ // New handlers for enhanced Playwright parity
811
/**
 * Fill the element at `command.selector` with `command.value`.
 *
 * @param command - reads `id`, `selector`, `value`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when the fill fails.
 */
async function handleFill(command, browser) {
    const { id, selector } = command;
    const field = browser.getLocator(selector);
    try {
        await field.fill(command.value);
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { filled: true });
}
821
/**
 * Check the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when the check fails.
 */
async function handleCheck(command, browser) {
    const { id, selector } = command;
    const box = browser.getLocator(selector);
    try {
        await box.check();
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { checked: true });
}
831
/**
 * Uncheck the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when the uncheck fails.
 */
async function handleUncheck(command, browser) {
    const { id, selector } = command;
    const box = browser.getLocator(selector);
    try {
        await box.uncheck();
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { unchecked: true });
}
841
/**
 * Set the files of the input at `command.selector`. A single file entry is
 * wrapped into a one-element array first.
 *
 * @param command - reads `id`, `selector`, `files`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when `setInputFiles` fails.
 */
async function handleUpload(command, browser) {
    const input = browser.getLocator(command.selector);
    let files = command.files;
    if (!Array.isArray(files)) {
        files = [files];
    }
    try {
        await input.setInputFiles(files);
    }
    catch (failure) {
        throw toAIFriendlyError(failure, command.selector);
    }
    return successResponse(command.id, { uploaded: files });
}
852
/**
 * Double-click the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when the double-click fails.
 */
async function handleDoubleClick(command, browser) {
    const { id, selector } = command;
    const target = browser.getLocator(selector);
    try {
        await target.dblclick();
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { clicked: true });
}
862
/**
 * Focus the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 * @throws the result of `toAIFriendlyError` when focusing fails.
 */
async function handleFocus(command, browser) {
    const { id, selector } = command;
    const target = browser.getLocator(selector);
    try {
        await target.focus();
    }
    catch (failure) {
        throw toAIFriendlyError(failure, selector);
    }
    return successResponse(id, { focused: true });
}
872
/**
 * Drag from `command.source` to `command.target` within the current frame.
 *
 * @param command - reads `id`, `source`, `target`.
 * @param browser - must provide `getFrame()`.
 */
async function handleDrag(command, browser) {
    const { source, target } = command;
    await browser.getFrame().dragAndDrop(source, target);
    return successResponse(command.id, { dragged: true });
}
877
/**
 * Switch the browser to a frame identified by selector, name, or URL.
 *
 * @param command - reads `id`, `selector`, `name`, `url`.
 * @param browser - must provide `switchToFrame()`.
 */
async function handleFrame(command, browser) {
    const { selector, name, url } = command;
    await browser.switchToFrame({ selector, name, url });
    return successResponse(command.id, { switched: true });
}
885
/**
 * Switch the browser back to the main frame.
 *
 * @param command - reads `id`.
 * @param browser - must provide `switchToMainFrame()` (called without await).
 */
async function handleMainFrame(command, browser) {
    browser.switchToMainFrame();
    const payload = { switched: true };
    return successResponse(command.id, payload);
}
889
/**
 * Locate an element by ARIA role (optionally by name) and perform
 * `command.subaction` on it: 'click', 'fill', 'check', or 'hover'.
 *
 * An unrecognised subaction yields an `errorResponse` instead of silently
 * resolving to `undefined`, matching how the keyboard and clipboard handlers
 * report unknown operations.
 *
 * @param command - reads `id`, `role`, `name`, `exact`, `subaction`, `value`.
 * @param browser - must provide `getPage()`.
 */
async function handleGetByRole(command, browser) {
    const page = browser.getPage();
    const locator = page.getByRole(command.role, { name: command.name, exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            // A missing value fills with the empty string.
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown getByRole subaction: ${command.subaction}`);
    }
}
907
/**
 * Locate an element by its text and perform `command.subaction` on it:
 * 'click' or 'hover'.
 *
 * An unrecognised subaction yields an `errorResponse` instead of silently
 * resolving to `undefined`.
 *
 * @param command - reads `id`, `text`, `exact`, `subaction`.
 * @param browser - must provide `getPage()`.
 */
async function handleGetByText(command, browser) {
    const page = browser.getPage();
    const locator = page.getByText(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown getByText subaction: ${command.subaction}`);
    }
}
919
/**
 * Locate an element by its label and perform `command.subaction` on it:
 * 'click', 'fill', or 'check'.
 *
 * An unrecognised subaction yields an `errorResponse` instead of silently
 * resolving to `undefined`.
 *
 * @param command - reads `id`, `label`, `exact`, `subaction`, `value`.
 * @param browser - must provide `getPage()`.
 */
async function handleGetByLabel(command, browser) {
    const page = browser.getPage();
    const locator = page.getByLabel(command.label, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            // A missing value fills with the empty string.
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        default:
            return errorResponse(command.id, `Unknown getByLabel subaction: ${command.subaction}`);
    }
}
934
/**
 * Locate an element by its placeholder and perform `command.subaction` on it:
 * 'click' or 'fill'.
 *
 * An unrecognised subaction yields an `errorResponse` instead of silently
 * resolving to `undefined`.
 *
 * @param command - reads `id`, `placeholder`, `exact`, `subaction`, `value`.
 * @param browser - must provide `getPage()`.
 */
async function handleGetByPlaceholder(command, browser) {
    const page = browser.getPage();
    const locator = page.getByPlaceholder(command.placeholder, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            // A missing value fills with the empty string.
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        default:
            return errorResponse(command.id, `Unknown getByPlaceholder subaction: ${command.subaction}`);
    }
}
946
/**
 * Read cookies from the current page's context, filtered by `command.urls`.
 *
 * @param command - reads `id` and `urls`.
 * @param browser - must provide `getPage()`.
 */
async function handleCookiesGet(command, browser) {
    const ctx = browser.getPage().context();
    const cookies = await ctx.cookies(command.urls);
    return successResponse(command.id, { cookies });
}
952
/**
 * Add `command.cookies` to the current page's context. A cookie that carries
 * none of `url`, `domain`, or `path` gets the current page URL as its `url`;
 * all other cookies are passed through untouched.
 *
 * @param command - reads `id` and `cookies`.
 * @param browser - must provide `getPage()`.
 */
async function handleCookiesSet(command, browser) {
    const page = browser.getPage();
    const ctx = page.context();
    const fallbackUrl = page.url();
    const prepared = command.cookies.map((cookie) => {
        const hasScope = cookie.url || cookie.domain || cookie.path;
        return hasScope ? cookie : { ...cookie, url: fallbackUrl };
    });
    await ctx.addCookies(prepared);
    return successResponse(command.id, { set: true });
}
966
/**
 * Clear all cookies of the current page's context.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleCookiesClear(command, browser) {
    const ctx = browser.getPage().context();
    await ctx.clearCookies();
    return successResponse(command.id, { cleared: true });
}
972
/**
 * Read from web storage in the page. `command.type === 'local'` selects
 * `localStorage`; any other value selects `sessionStorage`.
 *
 * With `command.key`, returns that single item; otherwise returns every
 * key/value pair as `data`.
 *
 * @param command - reads `id`, `type`, `key`.
 * @param browser - must provide `getPage()`.
 */
async function handleStorageGet(command, browser) {
    const page = browser.getPage();
    const storageType = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    if (!command.key) {
        // No key requested: dump the whole storage area.
        const dumpScript = `
            (() => {
                const storage = ${storageType};
                const result = {};
                for (let i = 0; i < storage.length; i++) {
                    const key = storage.key(i);
                    if (key) result[key] = storage.getItem(key);
                }
                return result;
            })()
        `;
        const data = await page.evaluate(dumpScript);
        return successResponse(command.id, { data });
    }
    // The key is JSON-encoded so it lands in the script as a string literal.
    const lookupScript = `${storageType}.getItem(${JSON.stringify(command.key)})`;
    const value = await page.evaluate(lookupScript);
    return successResponse(command.id, { key: command.key, value });
}
994
/**
 * Write `command.value` under `command.key` in web storage.
 * `command.type === 'local'` selects `localStorage`; anything else selects
 * `sessionStorage`.
 *
 * @param command - reads `id`, `type`, `key`, `value`.
 * @param browser - must provide `getPage()`.
 */
async function handleStorageSet(command, browser) {
    const page = browser.getPage();
    const storageType = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    // Both arguments are JSON-encoded so they arrive as literals in the script.
    const keyLiteral = JSON.stringify(command.key);
    const valueLiteral = JSON.stringify(command.value);
    await page.evaluate(`${storageType}.setItem(${keyLiteral}, ${valueLiteral})`);
    return successResponse(command.id, { set: true });
}
1000
/**
 * Clear a web storage area. `command.type === 'local'` selects
 * `localStorage`; anything else selects `sessionStorage`.
 *
 * @param command - reads `id` and `type`.
 * @param browser - must provide `getPage()`.
 */
async function handleStorageClear(command, browser) {
    const page = browser.getPage();
    const storageType = command.type === 'local' ? 'localStorage' : 'sessionStorage';
    const clearScript = `${storageType}.clear()`;
    await page.evaluate(clearScript);
    return successResponse(command.id, { cleared: true });
}
1006
/**
 * Register how dialogs should be answered by forwarding `command.response`
 * and `command.promptText` to `browser.setDialogHandler`.
 *
 * @param command - reads `id`, `response`, `promptText`.
 * @param browser - must provide `setDialogHandler()`.
 */
async function handleDialog(command, browser) {
    const { response, promptText } = command;
    browser.setDialogHandler(response, promptText);
    return successResponse(command.id, { handler: 'set', response });
}
1010
/**
 * Render the current page to a PDF at `command.path`, using
 * `command.format` or 'Letter' when none is given.
 *
 * @param command - reads `id`, `path`, `format`.
 * @param browser - must provide `getPage()`.
 */
async function handlePdf(command, browser) {
    const pdfOptions = {
        path: command.path,
        format: command.format ?? 'Letter',
    };
    await browser.getPage().pdf(pdfOptions);
    return successResponse(command.id, { path: command.path });
}
1018
+ // Network & Request handlers
1019
/**
 * Register a route for `command.url`, forwarding `response` and `abort` to
 * `browser.addRoute`.
 *
 * @param command - reads `id`, `url`, `response`, `abort`.
 * @param browser - must provide `addRoute()`.
 */
async function handleRoute(command, browser) {
    const { url, response, abort } = command;
    await browser.addRoute(url, { response, abort });
    return successResponse(command.id, { routed: url });
}
1026
/**
 * Remove the route for `command.url` via `browser.removeRoute`. The response
 * reports the URL, or 'all' when no URL was given.
 *
 * @param command - reads `id` and `url`.
 * @param browser - must provide `removeRoute()`.
 */
async function handleUnroute(command, browser) {
    const { url } = command;
    await browser.removeRoute(url);
    return successResponse(command.id, { unrouted: url ?? 'all' });
}
1030
/**
 * Either clear the tracked requests (`command.clear`) or make sure request
 * tracking is started and return the tracked requests matching
 * `command.filter`.
 *
 * @param command - reads `id`, `clear`, `filter`.
 * @param browser - must provide `clearRequests()`, `startRequestTracking()`, `getRequests()`.
 */
async function handleRequests(command, browser) {
    if (!command.clear) {
        // Tracking is started on every listing call before reading.
        browser.startRequestTracking();
        const requests = browser.getRequests(command.filter);
        return successResponse(command.id, { requests });
    }
    browser.clearRequests();
    return successResponse(command.id, { cleared: true });
}
1040
/**
 * Click the element at `command.selector`, wait for the resulting download
 * event, and save the download to `command.path`.
 *
 * @param command - reads `id`, `selector`, `path`.
 * @param browser - must provide `getPage()` and `getLocator()`.
 */
async function handleDownload(command, browser) {
    const page = browser.getPage();
    const trigger = browser.getLocator(command.selector);
    // Start listening before clicking so the download event is not missed.
    const pendingDownload = page.waitForEvent('download');
    const pendingClick = trigger.click();
    const [download] = await Promise.all([pendingDownload, pendingClick]);
    await download.saveAs(command.path);
    const suggestedFilename = download.suggestedFilename();
    return successResponse(command.id, { path: command.path, suggestedFilename });
}
1050
/**
 * Set the geolocation through `browser.setGeolocation` and echo the
 * coordinates back.
 *
 * @param command - reads `id`, `latitude`, `longitude`, `accuracy`.
 * @param browser - must provide `setGeolocation()`.
 */
async function handleGeolocation(command, browser) {
    const { latitude, longitude, accuracy } = command;
    await browser.setGeolocation(latitude, longitude, accuracy);
    return successResponse(command.id, { latitude, longitude });
}
1057
/**
 * Forward `command.permissions` and `command.grant` to
 * `browser.setPermissions` and echo them back.
 *
 * @param command - reads `id`, `permissions`, `grant`.
 * @param browser - must provide `setPermissions()`.
 */
async function handlePermissions(command, browser) {
    const { permissions, grant } = command;
    await browser.setPermissions(permissions, grant);
    return successResponse(command.id, { permissions, granted: grant });
}
1064
/**
 * Resize the viewport through `browser.setViewport` and echo the dimensions.
 *
 * @param command - reads `id`, `width`, `height`.
 * @param browser - must provide `setViewport()`.
 */
async function handleViewport(command, browser) {
    const { width, height } = command;
    await browser.setViewport(width, height);
    return successResponse(command.id, { width, height });
}
1071
/**
 * Respond with a note that the user agent cannot be changed by this command.
 * No user agent is applied here.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleUserAgent(command, browser) {
    // The page and its context are still resolved, although their values are
    // not used, so this handler fails the same way as others when they are
    // unavailable.
    browser.getPage().context();
    const note = 'User agent can only be set at launch time. Use device command instead.';
    return successResponse(command.id, { note });
}
1079
/**
 * Apply a named device profile: its viewport size and, when the profile has a
 * device scale factor other than 1, that scale factor. Otherwise any device
 * metrics override is cleared, ignoring a failure of that clear.
 *
 * @param command - reads `id` and `device`.
 * @param browser - must provide `getDevice()`, `listDevices()`, `setViewport()`,
 *   `setDeviceScaleFactor()`, `clearDeviceMetricsOverride()`.
 * @throws Error naming up to ten available devices when the device is unknown.
 */
async function handleDevice(command, browser) {
    const profile = browser.getDevice(command.device);
    if (!profile) {
        const available = browser.listDevices().slice(0, 10).join(', ');
        throw new Error(`Unknown device: ${command.device}. Available: ${available}...`);
    }
    const { width, height } = profile.viewport;
    await browser.setViewport(width, height);
    const needsScaling = profile.deviceScaleFactor && profile.deviceScaleFactor !== 1;
    if (needsScaling) {
        // HiDPI / retina profile: apply its scale factor.
        await browser.setDeviceScaleFactor(profile.deviceScaleFactor, profile.viewport.width, profile.viewport.height, profile.isMobile ?? false);
    }
    else {
        // Back to the default scale; a failure here is deliberately ignored
        // (e.g. when no override was ever set).
        try {
            await browser.clearDeviceMetricsOverride();
        }
        catch {
            // Intentionally empty.
        }
    }
    return successResponse(command.id, {
        device: command.device,
        viewport: profile.viewport,
        userAgent: profile.userAgent,
        deviceScaleFactor: profile.deviceScaleFactor,
    });
}
1108
/**
 * Navigate back in history and report the resulting page URL.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleBack(command, browser) {
    const activePage = browser.getPage();
    await activePage.goBack();
    const url = activePage.url();
    return successResponse(command.id, { url });
}
1113
/**
 * Navigate forward in history and report the resulting page URL.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleForward(command, browser) {
    const activePage = browser.getPage();
    await activePage.goForward();
    const url = activePage.url();
    return successResponse(command.id, { url });
}
1118
/**
 * Reload the current page and report its URL afterwards.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleReload(command, browser) {
    const activePage = browser.getPage();
    await activePage.reload();
    const url = activePage.url();
    return successResponse(command.id, { url });
}
1123
/**
 * Report the URL of the current page.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleUrl(command, browser) {
    const url = browser.getPage().url();
    return successResponse(command.id, { url });
}
1127
/**
 * Report the title of the current page.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleTitle(command, browser) {
    const title = await browser.getPage().title();
    return successResponse(command.id, { title });
}
1132
/**
 * Read attribute `command.attribute` from the element at `command.selector`.
 * The response also carries the page URL as `origin`.
 *
 * @param command - reads `id`, `selector`, `attribute`.
 * @param browser - must provide `getPage()` and `getLocator()`.
 */
async function handleGetAttribute(command, browser) {
    const page = browser.getPage();
    const { attribute } = command;
    const value = await browser.getLocator(command.selector).getAttribute(attribute);
    return successResponse(command.id, { attribute, value, origin: page.url() });
}
1138
/**
 * Read the `textContent` of the element at `command.selector`.
 * The response also carries the page URL as `origin`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()` and `getLocator()`.
 */
async function handleGetText(command, browser) {
    const page = browser.getPage();
    const text = await browser.getLocator(command.selector).textContent();
    return successResponse(command.id, { text, origin: page.url() });
}
1144
/**
 * Report whether the element at `command.selector` is visible.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 */
async function handleIsVisible(command, browser) {
    const { id, selector } = command;
    const visible = await browser.getLocator(selector).isVisible();
    return successResponse(id, { visible });
}
1149
/**
 * Report whether the element at `command.selector` is enabled.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 */
async function handleIsEnabled(command, browser) {
    const { id, selector } = command;
    const enabled = await browser.getLocator(selector).isEnabled();
    return successResponse(id, { enabled });
}
1154
/**
 * Report whether the element at `command.selector` is checked.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getLocator()`.
 */
async function handleIsChecked(command, browser) {
    const { id, selector } = command;
    const checked = await browser.getLocator(selector).isChecked();
    return successResponse(id, { checked });
}
1159
/**
 * Count the elements matching `command.selector` on the current page.
 * The selector goes straight to `page.locator`, not `browser.getLocator`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleCount(command, browser) {
    const matches = browser.getPage().locator(command.selector);
    const count = await matches.count();
    return successResponse(command.id, { count });
}
1164
/**
 * Return the bounding box of the element at `command.selector`.
 * The selector goes straight to `page.locator`, not `browser.getLocator`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleBoundingBox(command, browser) {
    const target = browser.getPage().locator(command.selector);
    const box = await target.boundingBox();
    return successResponse(command.id, { box });
}
1169
/**
 * Extract tag, truncated text, rounded bounding box, and a fixed set of
 * computed styles for the element(s) at `command.selector`.
 *
 * When `browser.isRef(selector)` is true, the single located element is
 * inspected. Otherwise the selector is treated as CSS and every match is
 * inspected. Either way the response holds an `elements` array.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`, `isRef()`, `getLocator()`.
 */
async function handleStyles(command, browser) {
    const page = browser.getPage();
    // The extractor travels to the page as source text and is eval'd there,
    // so one definition serves both the single- and multi-element paths.
    const extractStylesScript = `(function(el) {
        const s = getComputedStyle(el);
        const r = el.getBoundingClientRect();
        return {
            tag: el.tagName.toLowerCase(),
            text: el.innerText?.trim().slice(0, 80) || null,
            box: {
                x: Math.round(r.x),
                y: Math.round(r.y),
                width: Math.round(r.width),
                height: Math.round(r.height),
            },
            styles: {
                fontSize: s.fontSize,
                fontWeight: s.fontWeight,
                fontFamily: s.fontFamily.split(',')[0].trim().replace(/"/g, ''),
                color: s.color,
                backgroundColor: s.backgroundColor,
                borderRadius: s.borderRadius,
                border: s.border !== 'none' && s.borderWidth !== '0px' ? s.border : null,
                boxShadow: s.boxShadow !== 'none' ? s.boxShadow : null,
                padding: s.padding,
            },
        };
    })`;
    const { selector } = command;
    if (!browser.isRef(selector)) {
        // CSS selector: may match any number of elements.
        const elements = (await page.$$eval(selector, (nodes, source) => {
            const extract = eval(source);
            return nodes.map((node) => extract(node));
        }, extractStylesScript));
        return successResponse(command.id, { elements });
    }
    // Ref: exactly one element.
    const single = (await browser.getLocator(selector).evaluate((node, source) => {
        const extract = eval(source);
        return extract(node);
    }, extractStylesScript));
    return successResponse(command.id, { elements: [single] });
}
1213
+ // Advanced handlers
1214
/**
 * Respond with a note that video recording has to be enabled at launch; this
 * handler does not start any recording. `command.path` is echoed back.
 *
 * @param command - reads `id` and `path`.
 * @param browser - unused.
 */
async function handleVideoStart(command, browser) {
    const note = 'Video recording must be enabled at browser launch. Use --video flag when starting.';
    return successResponse(command.id, { note, path: command.path });
}
1222
/**
 * Report the path of the current page's video, or a note when the page has
 * no video object.
 *
 * @param command - reads `id`.
 * @param browser - must provide `getPage()`.
 */
async function handleVideoStop(command, browser) {
    const recording = browser.getPage().video();
    if (!recording) {
        return successResponse(command.id, { note: 'No video recording active' });
    }
    const path = await recording.path();
    return successResponse(command.id, { path });
}
1231
/**
 * Start tracing, forwarding the `screenshots` and `snapshots` flags to
 * `browser.startTracing`.
 *
 * @param command - reads `id`, `screenshots`, `snapshots`.
 * @param browser - must provide `startTracing()`.
 */
async function handleTraceStart(command, browser) {
    const { screenshots, snapshots } = command;
    await browser.startTracing({ screenshots, snapshots });
    return successResponse(command.id, { started: true });
}
1238
/**
 * Stop tracing via `browser.stopTracing(command.path)`. The response reports
 * the path when one was given, otherwise `{ traceStopped: true }`.
 *
 * @param command - reads `id` and `path`.
 * @param browser - must provide `stopTracing()`.
 */
async function handleTraceStop(command, browser) {
    await browser.stopTracing(command.path);
    if (command.path) {
        return successResponse(command.id, { path: command.path });
    }
    return successResponse(command.id, { traceStopped: true });
}
1242
/**
 * Start profiling with the categories given in `command.categories`.
 *
 * @param command - reads `id` and `categories`.
 * @param browser - must provide `startProfiling()`.
 */
async function handleProfilerStart(command, browser) {
    const { categories } = command;
    await browser.startProfiling({ categories });
    return successResponse(command.id, { started: true });
}
1246
/**
 * Stop profiling and write the profile to `command.path`. When no path is
 * given, a file named `profile-<timestamp>-<random>.json` is used inside
 * `<appDir>/tmp/profiles`, which is created if missing.
 *
 * @param command - reads `id` and `path`.
 * @param browser - must provide `stopProfiling()`.
 * @returns `successResponse` carrying whatever `stopProfiling` returned.
 */
async function handleProfilerStop(command, browser) {
    const resolveOutputPath = () => {
        if (command.path) {
            return command.path;
        }
        // ':' and '.' are replaced so the ISO timestamp is filename-safe.
        const timestamp = new Date().toISOString().replace(/[:.]/g, '-');
        const random = Math.random().toString(36).substring(2, 8);
        const profileDir = path.join(getAppDir(), 'tmp', 'profiles');
        mkdirSync(profileDir, { recursive: true });
        return path.join(profileDir, `profile-${timestamp}-${random}.json`);
    };
    const outcome = await browser.stopProfiling(resolveOutputPath());
    return successResponse(command.id, outcome);
}
1259
/**
 * Start HAR recording and request tracking on the browser.
 *
 * @param command - reads `id`.
 * @param browser - must provide `startHarRecording()` and `startRequestTracking()`.
 */
async function handleHarStart(command, browser) {
    await browser.startHarRecording();
    browser.startRequestTracking();
    const payload = { started: true };
    return successResponse(command.id, payload);
}
1264
/**
 * Report `command.path` and the number of tracked requests.
 *
 * NOTE(review): this handler itself writes nothing to `command.path`; it only
 * counts what `browser.getRequests()` returns. Confirm whether the file is
 * produced elsewhere.
 *
 * @param command - reads `id` and `path`.
 * @param browser - must provide `getRequests()`.
 */
async function handleHarStop(command, browser) {
    const requestCount = browser.getRequests().length;
    return successResponse(command.id, { path: command.path, requestCount });
}
1273
/**
 * Save the browser storage state to `command.path`.
 *
 * @param command - reads `id` and `path`.
 * @param browser - must provide `saveStorageState()`.
 */
async function handleStateSave(command, browser) {
    const { id, path } = command;
    await browser.saveStorageState(path);
    return successResponse(id, { path });
}
1277
/**
 * Launch the browser headless with the state file at `command.path`.
 * Refuses with an `errorResponse` when the browser is already launched or the
 * file does not exist.
 *
 * @param command - reads `id` and `path`.
 * @param browser - must provide `isLaunched()` and `launch()`.
 */
async function handleStateLoad(command, browser) {
    const statePath = command.path;
    if (browser.isLaunched()) {
        return errorResponse(command.id, 'Cannot load state while browser is running. Close browser first, then relaunch with loaded state.');
    }
    const fileExists = fs.existsSync(statePath);
    if (!fileExists) {
        return errorResponse(command.id, `State file not found: ${command.path}`);
    }
    const launchCommand = {
        id: command.id,
        action: 'launch',
        headless: true,
        autoStateFilePath: statePath,
    };
    await browser.launch(launchCommand);
    return successResponse(command.id, { loaded: true, path: statePath });
}
1295
/**
 * List the saved state files in the sessions directory, newest first, with
 * size, modification time, and whether each file's JSON content is an
 * encrypted payload (files that cannot be read or parsed count as not
 * encrypted).
 *
 * @param command - reads `id`.
 */
async function handleStateList(command) {
    const directory = getSessionsDir();
    const names = listStateFiles();
    if (names.length === 0) {
        return successResponse(command.id, { files: [], directory });
    }
    // Reports whether a file holds an encrypted payload; any read or parse
    // failure is treated as "not encrypted".
    const detectEncryption = (filepath) => {
        try {
            return isEncryptedPayload(JSON.parse(fs.readFileSync(filepath, 'utf-8')));
        }
        catch {
            return false;
        }
    };
    const described = [];
    for (const filename of names) {
        const filepath = path.join(directory, filename);
        const stats = fs.statSync(filepath);
        const encrypted = detectEncryption(filepath);
        described.push({
            filename,
            path: filepath,
            size: stats.size,
            modified: stats.mtime.toISOString(),
            encrypted,
        });
    }
    const byNewest = (a, b) => new Date(b.modified).getTime() - new Date(a.modified).getTime();
    described.sort(byNewest);
    return successResponse(command.id, { files: described, directory });
}
1325
/**
 * Delete saved state files. With `command.all`, every listed file is removed;
 * otherwise, with `command.sessionName`, only files whose name starts with
 * `<sessionName>-`. With neither, nothing is deleted.
 *
 * @param command - reads `id`, `all`, `sessionName`.
 * @returns `errorResponse` for an invalid session name, otherwise
 *   `successResponse` with the count and names of deleted files.
 */
async function handleStateClear(command) {
    const directory = getSessionsDir();
    const { sessionName } = command;
    if (sessionName && !isValidSessionName(sessionName)) {
        return errorResponse(command.id, 'Invalid session name. Use only letters, numbers, dashes, and underscores.');
    }
    const names = listStateFiles();
    if (names.length === 0) {
        return successResponse(command.id, { cleared: 0, deleted: [] });
    }
    // Pick the deletion rule once; `all` takes precedence over `sessionName`.
    let matches;
    if (command.all) {
        matches = () => true;
    }
    else if (sessionName) {
        matches = (name) => name.startsWith(`${sessionName}-`);
    }
    else {
        matches = () => false;
    }
    const deleted = [];
    for (const name of names) {
        if (!matches(name)) {
            continue;
        }
        fs.unlinkSync(path.join(directory, name));
        deleted.push(name);
    }
    return successResponse(command.id, { cleared: deleted.length, deleted });
}
1351
/**
 * Show one saved state file: file metadata, whether it was encrypted, a
 * summary (cookie count, origin count, distinct cookie domains), and the
 * full state.
 *
 * The filename must end in `.json`, and the part before it must pass
 * `isValidSessionName`.
 *
 * @param command - reads `id` and `filename`.
 * @returns `errorResponse` for an invalid name, a missing file, or a failure
 *   while reading the state; otherwise `successResponse`.
 */
async function handleStateShow(command) {
    const directory = getSessionsDir();
    const { filename } = command;
    const stem = filename.replace(/\.json$/, '');
    const nameIsValid = filename.endsWith('.json') && isValidSessionName(stem);
    if (!nameIsValid) {
        return errorResponse(command.id, 'Invalid filename. Use only letters, numbers, dashes, and underscores (with .json extension).');
    }
    const filepath = path.join(directory, filename);
    if (!fs.existsSync(filepath)) {
        return errorResponse(command.id, `State file not found: ${command.filename}`);
    }
    try {
        const loaded = readStateFile(filepath);
        const state = loaded.data;
        const stats = fs.statSync(filepath);
        const cookieList = state.cookies || [];
        const summary = {
            cookies: state.cookies?.length || 0,
            origins: state.origins?.length || 0,
            domains: [...new Set(cookieList.map((cookie) => cookie.domain))],
        };
        return successResponse(command.id, {
            filename,
            path: filepath,
            size: stats.size,
            modified: stats.mtime.toISOString(),
            encrypted: loaded.wasEncrypted,
            summary,
            state,
        });
    }
    catch (e) {
        return errorResponse(command.id, `Failed to parse state file: ${e.message}`);
    }
}
1386
/**
 * Run `cleanupExpiredStates(command.days)` and report what it deleted plus
 * how many state files remain afterwards.
 *
 * @param command - reads `id` and `days`.
 */
async function handleStateClean(command) {
    const { days } = command;
    const deleted = cleanupExpiredStates(days);
    // Counted after the cleanup, so this is the number of surviving files.
    const keptCount = listStateFiles().length;
    return successResponse(command.id, { cleaned: deleted.length, deleted, keptCount, days });
}
1396
/**
 * Rename `<oldName>.json` to `<newName>.json` inside the sessions directory.
 *
 * @param command - reads `id`, `oldName`, `newName`.
 * @returns `errorResponse` when either name is invalid, the source is
 *   missing, or the destination already exists; otherwise `successResponse`.
 */
async function handleStateRename(command) {
    const directory = getSessionsDir();
    const { oldName, newName } = command;
    const namesAreValid = isValidSessionName(oldName) && isValidSessionName(newName);
    if (!namesAreValid) {
        return errorResponse(command.id, 'Invalid name. Use only letters, numbers, dashes, and underscores.');
    }
    const oldFile = `${oldName}.json`;
    const newFile = `${newName}.json`;
    const oldPath = path.join(directory, oldFile);
    const newPath = path.join(directory, newFile);
    if (!fs.existsSync(oldPath)) {
        return errorResponse(command.id, `State file not found: ${command.oldName}.json`);
    }
    // Never overwrite an existing state file.
    if (fs.existsSync(newPath)) {
        return errorResponse(command.id, `Destination already exists: ${command.newName}.json`);
    }
    fs.renameSync(oldPath, newPath);
    return successResponse(command.id, {
        renamed: true,
        oldName: oldFile,
        newName: newFile,
        path: newPath,
    });
}
1417
/**
 * Either clear the collected console messages (`command.clear`) or return
 * them together with the current page URL.
 *
 * @param command - reads `id` and `clear`.
 * @param browser - must provide `clearConsoleMessages()`, `getPage()`, `getConsoleMessages()`.
 */
async function handleConsole(command, browser) {
    if (!command.clear) {
        const page = browser.getPage();
        const messages = browser.getConsoleMessages();
        return successResponse(command.id, { messages, origin: page.url() });
    }
    browser.clearConsoleMessages();
    return successResponse(command.id, { cleared: true });
}
1426
/**
 * Either clear the collected page errors (`command.clear`) or return them.
 *
 * @param command - reads `id` and `clear`.
 * @param browser - must provide `clearPageErrors()` and `getPageErrors()`.
 */
async function handleErrors(command, browser) {
    if (!command.clear) {
        const errors = browser.getPageErrors();
        return successResponse(command.id, { errors });
    }
    browser.clearPageErrors();
    return successResponse(command.id, { cleared: true });
}
1434
/**
 * Drive the page keyboard. `command.subaction` (default 'press') selects:
 *   - 'type':       type `command.text` with optional `command.delay`,
 *   - 'press':      press `command.keys`,
 *   - 'insertText': insert `command.text`.
 * Missing text/keys fall back to the empty string. Any other subaction
 * yields an `errorResponse`.
 *
 * @param command - reads `id`, `subaction`, `text`, `delay`, `keys`.
 * @param browser - must provide `getPage()`.
 */
async function handleKeyboard(command, browser) {
    const { keyboard } = browser.getPage();
    const sub = command.subaction ?? 'press';
    if (sub === 'type') {
        await keyboard.type(command.text ?? '', { delay: command.delay });
        return successResponse(command.id, { typed: true, text: command.text });
    }
    if (sub === 'press') {
        await keyboard.press(command.keys ?? '');
        return successResponse(command.id, { pressed: command.keys });
    }
    if (sub === 'insertText') {
        await keyboard.insertText(command.text ?? '');
        return successResponse(command.id, { inserted: true, text: command.text });
    }
    return errorResponse(command.id, `Unknown keyboard subaction: ${sub}`);
}
1451
/**
 * Dispatch a mouse wheel event with `command.deltaX` / `command.deltaY`
 * (default 0 each). When `command.selector` is set, that element is hovered
 * first.
 *
 * @param command - reads `id`, `selector`, `deltaX`, `deltaY`.
 * @param browser - must provide `getPage()`.
 */
async function handleWheel(command, browser) {
    const page = browser.getPage();
    const { selector } = command;
    if (selector) {
        await page.locator(selector).hover();
    }
    const dx = command.deltaX ?? 0;
    const dy = command.deltaY ?? 0;
    await page.mouse.wheel(dx, dy);
    return successResponse(command.id, { scrolled: true });
}
1460
/**
 * Tap the element at `command.selector` via `page.tap`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleTap(command, browser) {
    const { id, selector } = command;
    await browser.getPage().tap(selector);
    return successResponse(id, { tapped: true });
}
1465
/**
 * Perform a clipboard operation chosen by `command.operation`:
 *   - 'copy':  press Control+c,
 *   - 'paste': press Control+v,
 *   - 'read':  evaluate `navigator.clipboard.readText()` in the page.
 * Any other operation yields an `errorResponse`.
 *
 * @param command - reads `id` and `operation`.
 * @param browser - must provide `getPage()`.
 */
async function handleClipboard(command, browser) {
    const page = browser.getPage();
    const { operation } = command;
    if (operation === 'copy') {
        await page.keyboard.press('Control+c');
        return successResponse(command.id, { copied: true });
    }
    if (operation === 'paste') {
        await page.keyboard.press('Control+v');
        return successResponse(command.id, { pasted: true });
    }
    if (operation === 'read') {
        const text = await page.evaluate('navigator.clipboard.readText()');
        return successResponse(command.id, { text });
    }
    return errorResponse(command.id, 'Unknown clipboard operation');
}
1481
/**
 * Highlight the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleHighlight(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.highlight();
    return successResponse(command.id, { highlighted: true });
}
1486
/**
 * Clear the input at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleClear(command, browser) {
    const field = browser.getPage().locator(command.selector);
    await field.clear();
    return successResponse(command.id, { cleared: true });
}
1491
/**
 * Select the text of the element at `command.selector`.
 *
 * @param command - reads `id` and `selector`.
 * @param browser - must provide `getPage()`.
 */
async function handleSelectAll(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.selectText();
    return successResponse(command.id, { selected: true });
}
1496
/**
 * Handles the inner-text command: reads `innerText()` from the locator for
 * `command.selector`.
 *
 * @returns The success response `{ text }`.
 */
async function handleInnerText(command, browser) {
    const target = browser.getPage().locator(command.selector);
    const text = await target.innerText();
    return successResponse(command.id, { text });
}
1501
/**
 * Handles the inner-HTML command: reads `innerHTML()` from the locator for
 * `command.selector`.
 *
 * @returns The success response `{ html, origin }`, where `origin` is the
 *          page URL read after the markup was fetched.
 */
async function handleInnerHtml(command, browser) {
    const page = browser.getPage();
    const target = page.locator(command.selector);
    const html = await target.innerHTML();
    const origin = page.url();
    return successResponse(command.id, { html, origin });
}
1506
/**
 * Handles the input-value command: reads `inputValue()` from the locator that
 * `browser.getLocator` resolves for `command.selector`.
 *
 * @returns The success response `{ value, origin }`, where `origin` is the
 *          page URL read after the value was fetched.
 */
async function handleInputValue(command, browser) {
    const page = browser.getPage();
    const field = browser.getLocator(command.selector);
    const value = await field.inputValue();
    const origin = page.url();
    return successResponse(command.id, { value, origin });
}
1512
/**
 * Handles the set-value command: fills the locator for `command.selector`
 * with `command.value`.
 *
 * @returns The success response `{ set: true }`.
 */
async function handleSetValue(command, browser) {
    const field = browser.getPage().locator(command.selector);
    await field.fill(command.value);
    return successResponse(command.id, { set: true });
}
1517
/**
 * Handles the dispatch command: dispatches the event named `command.event`
 * (initialised with `command.eventInit`) on the locator for
 * `command.selector`.
 *
 * @returns The success response `{ dispatched: <event name> }`.
 */
async function handleDispatch(command, browser) {
    const target = browser.getPage().locator(command.selector);
    await target.dispatchEvent(command.event, command.eventInit);
    return successResponse(command.id, { dispatched: command.event });
}
1522
/**
 * Handles the eval-handle command: evaluates `command.script` in the page via
 * `page.evaluateHandle` and reports the handle's JSON value.
 *
 * If the value cannot be serialised (`jsonValue()` rejects), the placeholder
 * string 'Handle (non-serializable)' is reported instead.
 *
 * @param command - Reads `id` and `script`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns The success response `{ result }`.
 */
async function handleEvalHandle(command, browser) {
    const page = browser.getPage();
    const handle = await page.evaluateHandle(command.script);
    try {
        const result = await handle.jsonValue().catch(() => 'Handle (non-serializable)');
        return successResponse(command.id, { result });
    }
    finally {
        // The handle is never returned to the caller, so release it here;
        // otherwise every call keeps the referenced page object alive.
        // Disposal is best-effort: a failure (e.g. the page already closed)
        // must not mask the response computed above.
        await handle.dispose().catch(() => { });
    }
}
1528
/**
 * Handles the expose command: registers a page-callable function under
 * `command.name` via `page.exposeFunction`.
 *
 * The exposed function is a placeholder that only returns a string naming
 * itself.
 *
 * @returns The success response `{ exposed: <name> }`.
 */
async function handleExpose(command, browser) {
    // Placeholder implementation - can be extended
    const placeholder = () => `Function ${command.name} called`;
    await browser.getPage().exposeFunction(command.name, placeholder);
    return successResponse(command.id, { exposed: command.name });
}
1536
/**
 * Handles the add-script command: injects a script tag into the page.
 *
 * `command.content` (inline source) takes precedence over `command.url`.
 * When neither is provided nothing can be injected, so an error response is
 * returned instead of a misleading `{ added: true }`.
 *
 * @param command - Reads `id`, `content`, `url`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns The success response `{ added: true }`, or an error response when
 *          both `content` and `url` are missing/empty.
 */
async function handleAddScript(command, browser) {
    const page = browser.getPage();
    if (command.content) {
        await page.addScriptTag({ content: command.content });
    }
    else if (command.url) {
        await page.addScriptTag({ url: command.url });
    }
    else {
        return errorResponse(command.id, 'addscript requires either content or url');
    }
    return successResponse(command.id, { added: true });
}
1546
/**
 * Handles the add-style command: injects a style tag into the page.
 *
 * `command.content` (inline CSS) takes precedence over `command.url`.
 * When neither is provided nothing can be injected, so an error response is
 * returned instead of a misleading `{ added: true }`.
 *
 * @param command - Reads `id`, `content`, `url`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns The success response `{ added: true }`, or an error response when
 *          both `content` and `url` are missing/empty.
 */
async function handleAddStyle(command, browser) {
    const page = browser.getPage();
    if (command.content) {
        await page.addStyleTag({ content: command.content });
    }
    else if (command.url) {
        await page.addStyleTag({ url: command.url });
    }
    else {
        return errorResponse(command.id, 'addstyle requires either content or url');
    }
    return successResponse(command.id, { added: true });
}
1556
/**
 * Handles the emulate-media command: forwards `media`, `colorScheme`,
 * `reducedMotion` and `forcedColors` from the command to
 * `page.emulateMedia`.
 *
 * A truthy `colorScheme` is additionally recorded on the browser manager via
 * `browser.setColorScheme`.
 *
 * @returns The success response `{ emulated: true }`.
 */
async function handleEmulateMedia(command, browser) {
    const { media, colorScheme, reducedMotion, forcedColors } = command;
    const page = browser.getPage();
    await page.emulateMedia({ media, colorScheme, reducedMotion, forcedColors });
    if (command.colorScheme) {
        browser.setColorScheme(command.colorScheme);
    }
    return successResponse(command.id, { emulated: true });
}
1569
/**
 * Handles the offline command: passes `command.offline` to
 * `browser.setOffline`.
 *
 * @returns The success response echoing the requested `offline` value.
 */
async function handleOffline(command, browser) {
    await browser.setOffline(command.offline);
    const payload = { offline: command.offline };
    return successResponse(command.id, payload);
}
1573
/**
 * Handles the headers command: passes `command.headers` to
 * `browser.setExtraHeaders`.
 *
 * @returns The success response `{ set: true }`.
 */
async function handleHeaders(command, browser) {
    const extraHeaders = command.headers;
    await browser.setExtraHeaders(extraHeaders);
    return successResponse(command.id, { set: true });
}
1577
/**
 * Handles the pause command: awaits `page.pause()` and then reports success.
 *
 * @returns The success response `{ paused: true }`.
 */
async function handlePause(command, browser) {
    await browser.getPage().pause();
    return successResponse(command.id, { paused: true });
}
1582
/**
 * Handles the get-by-alt-text command: locates an element by alt text
 * (`command.text`, with `command.exact` forwarded as the `exact` option) and
 * performs `command.subaction` on it.
 *
 * Supported subactions: `click`, `hover`.
 *
 * @param command - Reads `id`, `text`, `exact`, `subaction`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns A success response for the subaction, or an error response for an
 *          unsupported subaction (so callers never receive `undefined`).
 */
async function handleGetByAltText(command, browser) {
    const page = browser.getPage();
    const locator = page.getByAltText(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1594
/**
 * Handles the get-by-title command: locates an element by title
 * (`command.text`, with `command.exact` forwarded as the `exact` option) and
 * performs `command.subaction` on it.
 *
 * Supported subactions: `click`, `hover`.
 *
 * @param command - Reads `id`, `text`, `exact`, `subaction`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns A success response for the subaction, or an error response for an
 *          unsupported subaction (so callers never receive `undefined`).
 */
async function handleGetByTitle(command, browser) {
    const page = browser.getPage();
    const locator = page.getByTitle(command.text, { exact: command.exact });
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1606
/**
 * Handles the get-by-test-id command: locates an element by
 * `command.testId` and performs `command.subaction` on it.
 *
 * Supported subactions: `click`, `fill` (with `command.value`, defaulting to
 * the empty string), `check`, `hover`.
 *
 * @param command - Reads `id`, `testId`, `subaction`, `value`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns A success response for the subaction, or an error response for an
 *          unsupported subaction (so callers never receive `undefined`).
 */
async function handleGetByTestId(command, browser) {
    const page = browser.getPage();
    const locator = page.getByTestId(command.testId);
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1624
/**
 * Handles the nth command: picks one match of `command.selector` by position
 * and performs `command.subaction` on it.
 *
 * An index of -1 selects the last match; any other index is passed to
 * `nth()`.
 *
 * Supported subactions: `click`, `fill` (with `command.value`, defaulting to
 * the empty string), `check`, `hover`, `text` (returns `textContent()`).
 *
 * @param command - Reads `id`, `selector`, `index`, `subaction`, `value`.
 * @param browser - Browser manager exposing `getPage()`.
 * @returns A success response for the subaction, or an error response for an
 *          unsupported subaction (so callers never receive `undefined`).
 */
async function handleNth(command, browser) {
    const page = browser.getPage();
    const base = page.locator(command.selector);
    const locator = command.index === -1 ? base.last() : base.nth(command.index);
    switch (command.subaction) {
        case 'click':
            await locator.click();
            return successResponse(command.id, { clicked: true });
        case 'fill':
            await locator.fill(command.value ?? '');
            return successResponse(command.id, { filled: true });
        case 'check':
            await locator.check();
            return successResponse(command.id, { checked: true });
        case 'hover':
            await locator.hover();
            return successResponse(command.id, { hovered: true });
        case 'text': {
            // Braces keep the declaration scoped to this case only.
            const text = await locator.textContent();
            return successResponse(command.id, { text });
        }
        default:
            return errorResponse(command.id, `Unknown subaction: ${command.subaction}`);
    }
}
1646
/**
 * Handles the wait-for-URL command: waits until the page URL matches
 * `command.url`, honouring `command.timeout`.
 *
 * @returns The success response `{ url }` with the page URL after the wait.
 */
async function handleWaitForUrl(command, browser) {
    const page = browser.getPage();
    const waitOptions = { timeout: command.timeout };
    await page.waitForURL(command.url, waitOptions);
    const url = page.url();
    return successResponse(command.id, { url });
}
1651
/**
 * Handles the wait-for-load-state command: waits for the page to reach
 * `command.state`, honouring `command.timeout`.
 *
 * @returns The success response echoing the requested `state`.
 */
async function handleWaitForLoadState(command, browser) {
    const waitOptions = { timeout: command.timeout };
    await browser.getPage().waitForLoadState(command.state, waitOptions);
    return successResponse(command.id, { state: command.state });
}
1656
/**
 * Handles the set-content command: replaces the page content with
 * `command.html`.
 *
 * @returns The success response `{ set: true }`.
 */
async function handleSetContent(command, browser) {
    const markup = command.html;
    await browser.getPage().setContent(markup);
    return successResponse(command.id, { set: true });
}
1661
/**
 * Handles the timezone command.
 *
 * The timezone is not applied here: the response carries a note that it must
 * be configured at browser launch (`--timezone`), and echoes the requested
 * value.
 *
 * Deliberately does not touch the page or its context. In particular it must
 * not call `setGeolocation`: doing so would silently override the context's
 * geolocation (e.g. to 0,0) while having no effect on the timezone.
 *
 * @param command - Reads `id` and `timezone`.
 * @param browser - Unused; kept so the handler signature matches the others.
 * @returns The success response `{ note, timezone }`.
 */
async function handleTimezone(command, browser) {
    return successResponse(command.id, {
        note: 'Timezone must be set at browser launch. Use --timezone flag.',
        timezone: command.timezone,
    });
}
1671
/**
 * Handles the locale command.
 *
 * The locale is not applied here: the response carries a note that it must be
 * configured at browser launch (`--locale`), and echoes the requested value.
 *
 * @returns The success response `{ note, locale }`.
 */
async function handleLocale(command, browser) {
    const payload = {
        note: 'Locale must be set at browser launch. Use --locale flag.',
        locale: command.locale,
    };
    return successResponse(command.id, payload);
}
1678
/**
 * Handles the credentials command: sets HTTP credentials on the current
 * page's context from `command.username` / `command.password`.
 *
 * @returns The success response `{ set: true }`.
 */
async function handleCredentials(command, browser) {
    const { username, password } = command;
    const pageContext = browser.getPage().context();
    await pageContext.setHTTPCredentials({ username, password });
    return successResponse(command.id, { set: true });
}
1686
/**
 * Handles the mouse-move command: moves the mouse to
 * (`command.x`, `command.y`).
 *
 * @returns The success response `{ moved: true, x, y }`.
 */
async function handleMouseMove(command, browser) {
    const { mouse } = browser.getPage();
    await mouse.move(command.x, command.y);
    return successResponse(command.id, { moved: true, x: command.x, y: command.y });
}
1691
/**
 * Handles the mouse-down command: presses `command.button`, falling back to
 * the left button when none is given.
 *
 * @returns The success response `{ down: true }`.
 */
async function handleMouseDown(command, browser) {
    const button = command.button ?? 'left';
    await browser.getPage().mouse.down({ button });
    return successResponse(command.id, { down: true });
}
1696
/**
 * Handles the mouse-up command: releases `command.button`, falling back to
 * the left button when none is given.
 *
 * @returns The success response `{ up: true }`.
 */
async function handleMouseUp(command, browser) {
    const button = command.button ?? 'left';
    await browser.getPage().mouse.up({ button });
    return successResponse(command.id, { up: true });
}
1701
/**
 * Handles the bring-to-front command: calls `bringToFront()` on the current
 * page.
 *
 * @returns The success response `{ focused: true }`.
 */
async function handleBringToFront(command, browser) {
    await browser.getPage().bringToFront();
    return successResponse(command.id, { focused: true });
}
1706
/**
 * Handles the wait-for-function command: passes `command.expression` to
 * `page.waitForFunction`, honouring `command.timeout`.
 *
 * @returns The success response `{ waited: true }`.
 */
async function handleWaitForFunction(command, browser) {
    const waitOptions = { timeout: command.timeout };
    await browser.getPage().waitForFunction(command.expression, waitOptions);
    return successResponse(command.id, { waited: true });
}
1711
/**
 * Handles the scroll-into-view command: calls `scrollIntoViewIfNeeded()` on
 * the locator that `browser.getLocator` resolves for `command.selector`.
 *
 * @returns The success response `{ scrolled: true }`.
 */
async function handleScrollIntoView(command, browser) {
    const target = browser.getLocator(command.selector);
    await target.scrollIntoViewIfNeeded();
    return successResponse(command.id, { scrolled: true });
}
1715
/**
 * Handles the add-init-script command: registers `command.script` as an init
 * script on the current page's context.
 *
 * @returns The success response `{ added: true }`.
 */
async function handleAddInitScript(command, browser) {
    const pageContext = browser.getPage().context();
    await pageContext.addInitScript(command.script);
    return successResponse(command.id, { added: true });
}
1720
/**
 * Handles the key-down command: holds down `command.key` on the page
 * keyboard.
 *
 * @returns The success response `{ down: true, key }`.
 */
async function handleKeyDown(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.down(command.key);
    return successResponse(command.id, { down: true, key: command.key });
}
1725
/**
 * Handles the key-up command: releases `command.key` on the page keyboard.
 *
 * @returns The success response `{ up: true, key }`.
 */
async function handleKeyUp(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.up(command.key);
    return successResponse(command.id, { up: true, key: command.key });
}
1730
/**
 * Handles the insert-text command: passes `command.text` to
 * `keyboard.insertText` on the current page.
 *
 * @returns The success response `{ inserted: true }`.
 */
async function handleInsertText(command, browser) {
    const { keyboard } = browser.getPage();
    await keyboard.insertText(command.text);
    return successResponse(command.id, { inserted: true });
}
1735
/**
 * Handles the multi-select command: selects `command.values` on the element
 * matching `command.selector`.
 *
 * @returns The success response `{ selected }`, where `selected` is whatever
 *          `selectOption` resolved to.
 */
async function handleMultiSelect(command, browser) {
    const dropdown = browser.getPage().locator(command.selector);
    const selected = await dropdown.selectOption(command.values);
    return successResponse(command.id, { selected });
}
1740
/**
 * Handles the wait-for-download command: waits for the page's next
 * `download` event, honouring `command.timeout`.
 *
 * When `command.path` is given the download is saved there. Otherwise the
 * reported path is the download's own path, or its suggested filename when
 * no path is available.
 *
 * @returns The success response `{ path, filename, url }`.
 */
async function handleWaitForDownload(command, browser) {
    const page = browser.getPage();
    const download = await page.waitForEvent('download', { timeout: command.timeout });
    let savedTo;
    if (!command.path) {
        const tempPath = await download.path();
        savedTo = tempPath || download.suggestedFilename();
    }
    else {
        savedTo = command.path;
        await download.saveAs(savedTo);
    }
    const payload = {
        path: savedTo,
        filename: download.suggestedFilename(),
        url: download.url(),
    };
    return successResponse(command.id, payload);
}
1757
/**
 * Handles the response-body command: waits for a network response whose URL
 * contains `command.url` (substring match), honouring `command.timeout`.
 *
 * The body is parsed as JSON when possible; otherwise the raw text is
 * reported.
 *
 * @returns The success response `{ url, status, body }`.
 */
async function handleResponseBody(command, browser) {
    const page = browser.getPage();
    const urlMatches = (resp) => resp.url().includes(command.url);
    const response = await page.waitForResponse(urlMatches, { timeout: command.timeout });
    const rawBody = await response.text();
    let body;
    try {
        body = JSON.parse(rawBody);
    }
    catch {
        // Not JSON - report the text as-is
        body = rawBody;
    }
    return successResponse(command.id, {
        url: response.url(),
        status: response.status(),
        body,
    });
}
1776
+ // Screencast and input injection handlers
1777
/**
 * Handles the screencast-start command: starts a screencast on the browser
 * manager, delivering frames to the module-level `screencastFrameCallback`.
 *
 * `format`, `quality`, `maxWidth`, `maxHeight` and `everyNthFrame` are
 * forwarded from the command unchanged.
 *
 * @throws Error when no frame callback has been registered.
 * @returns The success response `{ started, format, quality }`; `format`
 *          and `quality` are reported as 'jpeg' / 80 when not supplied.
 */
async function handleScreencastStart(command, browser) {
    if (!screencastFrameCallback) {
        throw new Error('Screencast frame callback not set. Start the streaming server first.');
    }
    const { format, quality, maxWidth, maxHeight, everyNthFrame } = command;
    const castOptions = { format, quality, maxWidth, maxHeight, everyNthFrame };
    await browser.startScreencast(screencastFrameCallback, castOptions);
    const payload = {
        started: true,
        format: command.format ?? 'jpeg',
        quality: command.quality ?? 80,
    };
    return successResponse(command.id, payload);
}
1794
/**
 * Handles the screencast-stop command: calls `browser.stopScreencast()`.
 *
 * @returns The success response `{ stopped: true }`.
 */
async function handleScreencastStop(command, browser) {
    await browser.stopScreencast();
    const payload = { stopped: true };
    return successResponse(command.id, payload);
}
1798
/**
 * Handles the input-mouse command: forwards the mouse event fields of the
 * command (`type`, `x`, `y`, `button`, `clickCount`, `deltaX`, `deltaY`,
 * `modifiers`) to `browser.injectMouseEvent`.
 *
 * @returns The success response `{ injected: true }`.
 */
async function handleInputMouse(command, browser) {
    const { type, x, y, button, clickCount, deltaX, deltaY, modifiers } = command;
    const mouseEvent = { type, x, y, button, clickCount, deltaX, deltaY, modifiers };
    await browser.injectMouseEvent(mouseEvent);
    return successResponse(command.id, { injected: true });
}
1811
/**
 * Handles the input-keyboard command: forwards the keyboard event fields of
 * the command (`type`, `key`, `code`, `text`, `modifiers`) to
 * `browser.injectKeyboardEvent`.
 *
 * @returns The success response `{ injected: true }`.
 */
async function handleInputKeyboard(command, browser) {
    const { type, key, code, text, modifiers } = command;
    const keyEvent = { type, key, code, text, modifiers };
    await browser.injectKeyboardEvent(keyEvent);
    return successResponse(command.id, { injected: true });
}
1821
/**
 * Handles the input-touch command: forwards the touch event fields of the
 * command (`type`, `touchPoints`, `modifiers`) to
 * `browser.injectTouchEvent`.
 *
 * @returns The success response `{ injected: true }`.
 */
async function handleInputTouch(command, browser) {
    const { type, touchPoints, modifiers } = command;
    const touchEvent = { type, touchPoints, modifiers };
    await browser.injectTouchEvent(touchEvent);
    return successResponse(command.id, { injected: true });
}
1829
+ // Recording handlers (Playwright native video recording)
1830
/**
 * Handles the recording-start command: calls `browser.startRecording` with
 * `command.path` and `command.url`.
 *
 * @returns The success response `{ started: true, path }`.
 */
async function handleRecordingStart(command, browser) {
    await browser.startRecording(command.path, command.url);
    const payload = { started: true, path: command.path };
    return successResponse(command.id, payload);
}
1837
/**
 * Handles the recording-stop command: calls `browser.stopRecording()` and
 * returns whatever it resolves to as the response payload.
 *
 * @returns The success response wrapping the stop result.
 */
async function handleRecordingStop(command, browser) {
    const stopInfo = await browser.stopRecording();
    return successResponse(command.id, stopInfo);
}
1841
/**
 * Handles the recording-restart command: calls `browser.restartRecording`
 * with `command.path` and `command.url`.
 *
 * @returns The success response `{ started, path, previousPath, stopped }`,
 *          where `previousPath` and `stopped` come from the restart result.
 */
async function handleRecordingRestart(command, browser) {
    const outcome = await browser.restartRecording(command.path, command.url);
    const payload = {
        started: true,
        path: command.path,
        previousPath: outcome.previousPath,
        stopped: outcome.stopped,
    };
    return successResponse(command.id, payload);
}
1850
+ // Diff handlers
1851
/**
 * Handles the diff-snapshot command: diffs a baseline snapshot against a
 * fresh snapshot of the current page.
 *
 * The baseline is read from the file at `command.baseline` when given;
 * otherwise the browser manager's last stored snapshot is used. The new
 * snapshot (or 'Empty page' when the tree is empty) is stored as the last
 * snapshot after diffing.
 *
 * @returns The success response wrapping the `diffSnapshots` result, or an
 *          error response when the baseline file cannot be read or no
 *          previous snapshot exists.
 */
async function handleDiffSnapshot(command, browser) {
    let baselineText;
    if (!command.baseline) {
        baselineText = browser.getLastSnapshot();
        if (!baselineText) {
            return errorResponse(command.id, 'No previous snapshot in this session. Take a snapshot first, or use --baseline <file>.');
        }
    }
    else {
        try {
            baselineText = fs.readFileSync(command.baseline, 'utf-8');
        }
        catch {
            return errorResponse(command.id, `Cannot read baseline file: ${command.baseline}`);
        }
    }
    const page = browser.getPage();
    const { selector, compact, maxDepth } = command;
    const snapshot = await getEnhancedSnapshot(page, { selector, compact, maxDepth });
    const currentText = snapshot.tree || 'Empty page';
    const diff = diffSnapshots(baselineText, currentText);
    browser.setLastSnapshot(currentText);
    return successResponse(command.id, diff);
}
1878
/**
 * Handles the diff-screenshot command: compares a baseline image file with a
 * fresh PNG screenshot.
 *
 * With `command.selector`, the screenshot is taken of that element (resolved
 * via `browser.getLocatorFromRef`, falling back to `page.locator`).
 * Otherwise the page is captured, honouring `command.fullPage`. The
 * baseline's MIME type is derived from its extension: `.jpg` / `.jpeg` are
 * JPEG, everything else is treated as PNG.
 *
 * @returns The success response wrapping the `diffScreenshots` result, or an
 *          error response when the baseline file does not exist.
 */
async function handleDiffScreenshot(command, browser) {
    const baselinePath = command.baseline;
    if (!fs.existsSync(baselinePath)) {
        return errorResponse(command.id, `Baseline file not found: ${command.baseline}`);
    }
    const page = browser.getPage();
    let currentShot;
    if (!command.selector) {
        currentShot = await page.screenshot({ fullPage: command.fullPage, type: 'png' });
    }
    else {
        const target = browser.getLocatorFromRef(command.selector) || page.locator(command.selector);
        currentShot = await target.screenshot({ type: 'png' });
    }
    const baselineShot = fs.readFileSync(command.baseline);
    const extension = path.extname(command.baseline).toLowerCase();
    const isJpeg = ['.jpg', '.jpeg'].includes(extension);
    const baselineMime = isJpeg ? 'image/jpeg' : 'image/png';
    const diffOptions = {
        threshold: command.threshold,
        outputPath: command.output,
        baselineMime,
    };
    const diff = await diffScreenshots(page.context(), baselineShot, currentShot, diffOptions);
    return successResponse(command.id, diff);
}
1901
/**
 * Handles the diff-URL command: navigates the current page to `command.url1`
 * and then `command.url2`, and diffs the snapshots taken at each.
 *
 * Both URLs are passed through `browser.checkDomainAllowed` before any
 * navigation happens, the same check the auth-login handler applies before
 * its own `page.goto`. Presumably the check throws for a disallowed domain
 * (its return value is not used anywhere visible), in which case this
 * handler rejects without having navigated the page.
 *
 * When `command.screenshot` is set, a screenshot is also captured at each
 * URL (honouring `command.fullPage`) and their diff is included.
 *
 * @param command - Reads `id`, `url1`, `url2`, `waitUntil` (default 'load'),
 *                  `selector`, `compact`, `maxDepth`, `screenshot`,
 *                  `fullPage`.
 * @param browser - Browser manager exposing `getPage()` and
 *                  `checkDomainAllowed()`.
 * @returns The success response `{ snapshot }`, plus `screenshot` when
 *          screenshots were requested.
 */
async function handleDiffUrl(command, browser) {
    // Validate both targets up front so a disallowed second URL is rejected
    // before the page has been navigated anywhere.
    browser.checkDomainAllowed(command.url1);
    browser.checkDomainAllowed(command.url2);
    const page = browser.getPage();
    const waitUntil = command.waitUntil ?? 'load';
    const snapshotOpts = {
        selector: command.selector,
        compact: command.compact,
        maxDepth: command.maxDepth,
    };
    // Capture state of url1
    await page.goto(command.url1, { waitUntil });
    const { tree: tree1 } = await getEnhancedSnapshot(page, snapshotOpts);
    const snapshot1 = tree1 || 'Empty page';
    let screenshot1;
    if (command.screenshot) {
        screenshot1 = await page.screenshot({ fullPage: command.fullPage, type: 'png' });
    }
    // Capture state of url2
    await page.goto(command.url2, { waitUntil });
    const { tree: tree2 } = await getEnhancedSnapshot(page, snapshotOpts);
    const snapshot2 = tree2 || 'Empty page';
    const snapshotDiff = diffSnapshots(snapshot1, snapshot2);
    const result = { snapshot: snapshotDiff };
    if (command.screenshot && screenshot1) {
        const screenshot2 = await page.screenshot({ fullPage: command.fullPage, type: 'png' });
        result.screenshot = await diffScreenshots(page.context(), screenshot1, screenshot2, {});
    }
    return successResponse(command.id, result);
}
1929
/**
 * Handles the auth-login command: loads the stored auth profile named
 * `command.name`, navigates to its URL and submits its credentials.
 *
 * Steps, in order:
 *  1. Look up the profile; error response if it does not exist.
 *  2. Run `browser.checkDomainAllowed` on the profile URL, then navigate.
 *  3. Resolve the username field and submit button, using the profile's
 *     custom selectors when present and otherwise the first visible match
 *     from a fixed list of candidate selectors. The password field uses the
 *     profile selector or a visible `input[type="password"]`.
 *  4. Fill username and password, click submit, wait for the load state.
 *  5. Record the login via `updateLastLogin`.
 *
 * @returns The success response `{ loggedIn, name, url, title }`, or an
 *          error response when the profile is missing, a field cannot be
 *          auto-detected, or any page interaction throws.
 */
async function handleAuthLogin(command, browser) {
    const profile = getAuthProfile(command.name);
    if (!profile) {
        return errorResponse(command.id, `Auth profile '${command.name}' not found`);
    }
    browser.checkDomainAllowed(profile.url);
    const page = browser.getPage();
    await page.goto(profile.url, { waitUntil: 'load' });
    const hasCustomSelector = Boolean(profile.usernameSelector || profile.passwordSelector || profile.submitSelector);
    if (!hasCustomSelector) {
        console.error(`[nstbrowser-ai-agent] Auth login '${command.name}': using auto-detected form selectors. ` +
            `If login fails, specify --username-selector/--password-selector/--submit-selector with auth save.`);
    }
    const passwordSelector = profile.passwordSelector || 'input[type="password"]:visible';
    // Candidates run from most specific to broadest. Locale-dependent text
    // matchers (e.g. "Sign in") are left out on purpose -- they break on
    // non-English pages.
    const usernameCandidates = [
        'input[autocomplete="username"]:visible',
        'input[type="email"]:visible',
        'input[name="username"]:visible',
        'input[name="email"]:visible',
    ];
    const submitCandidates = ['button[type="submit"]:visible', 'input[type="submit"]:visible'];
    // Returns the first candidate locator that reports visible, or null.
    const firstVisible = async (selectors) => {
        for (const selector of selectors) {
            const candidate = page.locator(selector).first();
            const visible = await candidate.isVisible({ timeout: 1000 }).catch(() => false);
            if (visible) {
                return candidate;
            }
        }
        return null;
    };
    try {
        // Username field: custom selector, else sequential auto-detect
        const usernameField = profile.usernameSelector
            ? page.locator(profile.usernameSelector).first()
            : await firstVisible(usernameCandidates);
        if (!usernameField) {
            return errorResponse(command.id, `Auth login failed for '${command.name}': could not find username field. ` +
                `Specify --username-selector with auth save.`);
        }
        // Submit button: custom selector, else sequential auto-detect
        const submitButton = profile.submitSelector
            ? page.locator(profile.submitSelector).first()
            : await firstVisible(submitCandidates);
        if (!submitButton) {
            return errorResponse(command.id, `Auth login failed for '${command.name}': could not find submit button. ` +
                `Specify --submit-selector with auth save.`);
        }
        await usernameField.fill(profile.username);
        await page.locator(passwordSelector).first().fill(profile.password);
        await submitButton.click();
        await page.waitForLoadState('load');
    }
    catch (err) {
        const reason = err instanceof Error ? err.message : err;
        return errorResponse(command.id, `Auth login failed for '${command.name}': ${reason}. ` +
            `Try specifying custom selectors with auth save --username-selector/--password-selector/--submit-selector`);
    }
    updateLastLogin(command.name);
    const url = page.url();
    const title = await page.title();
    return successResponse(command.id, {
        loggedIn: true,
        name: command.name,
        url,
        title,
    });
}
2009
/**
 * Handles the confirm command: executes a previously stored command that was
 * waiting for confirmation under `command.confirmationId`.
 *
 * The pending entry is removed on lookup. Before dispatching, the stored
 * command is re-parsed through `parseCommand`, the module-level
 * `actionPolicy` is refreshed via `reloadPolicyIfChanged`, and the action is
 * re-checked against that policy.
 *
 * @returns The response of the dispatched command, or an error response when
 *          no pending entry exists, the stored command no longer parses, or
 *          the policy now denies the action.
 */
async function handleConfirm(command, browser) {
    const pending = getAndRemovePending(command.confirmationId);
    if (!pending) {
        return errorResponse(command.id, `No pending confirmation with id '${command.confirmationId}'`);
    }
    // Round-trip the stored command through the schema to guard against
    // shape drift between when the confirmation was issued and now.
    const serialized = JSON.stringify(pending.command);
    const parsed = parseCommand(serialized);
    if (!parsed.success) {
        return errorResponse(command.id, `Stored command is no longer valid: ${parsed.error}`);
    }
    const storedCommand = parsed.command;
    // The policy may have been updated since the confirmation was issued,
    // so the deny list is consulted again.
    actionPolicy = reloadPolicyIfChanged();
    const verdict = checkPolicy(storedCommand.action, actionPolicy, new Set());
    if (verdict === 'deny') {
        const category = getActionCategory(storedCommand.action);
        return errorResponse(command.id, `Action denied by policy: '${category}' is not allowed`);
    }
    return await dispatchAction(storedCommand, browser);
}
2030
/**
 * Handles the deny command: discards the pending confirmation stored under
 * `command.confirmationId` without executing it.
 *
 * @returns The success response `{ denied: true }`, or an error response
 *          when no pending entry exists for that id.
 */
function handleDeny(command) {
    const pending = getAndRemovePending(command.confirmationId);
    if (pending) {
        return successResponse(command.id, { denied: true });
    }
    return errorResponse(command.id, `No pending confirmation with id '${command.confirmationId}'`);
}
2037
+ //# sourceMappingURL=actions.js.map