agent-browser 0.0.0 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52) hide show
  1. package/.prettierrc +7 -0
  2. package/README.md +271 -1
  3. package/bin/agent-browser +2 -0
  4. package/dist/actions.d.ts +7 -0
  5. package/dist/actions.d.ts.map +1 -0
  6. package/dist/actions.js +1138 -0
  7. package/dist/actions.js.map +1 -0
  8. package/dist/browser.d.ts +232 -0
  9. package/dist/browser.d.ts.map +1 -0
  10. package/dist/browser.js +477 -0
  11. package/dist/browser.js.map +1 -0
  12. package/dist/browser.test.d.ts +2 -0
  13. package/dist/browser.test.d.ts.map +1 -0
  14. package/dist/browser.test.js +136 -0
  15. package/dist/browser.test.js.map +1 -0
  16. package/dist/client.d.ts +17 -0
  17. package/dist/client.d.ts.map +1 -0
  18. package/dist/client.js +133 -0
  19. package/dist/client.js.map +1 -0
  20. package/dist/daemon.d.ts +29 -0
  21. package/dist/daemon.d.ts.map +1 -0
  22. package/dist/daemon.js +165 -0
  23. package/dist/daemon.js.map +1 -0
  24. package/dist/index.d.ts +3 -0
  25. package/dist/index.d.ts.map +1 -0
  26. package/dist/index.js +972 -0
  27. package/dist/index.js.map +1 -0
  28. package/dist/protocol.d.ts +26 -0
  29. package/dist/protocol.d.ts.map +1 -0
  30. package/dist/protocol.js +717 -0
  31. package/dist/protocol.js.map +1 -0
  32. package/dist/protocol.test.d.ts +2 -0
  33. package/dist/protocol.test.d.ts.map +1 -0
  34. package/dist/protocol.test.js +176 -0
  35. package/dist/protocol.test.js.map +1 -0
  36. package/dist/types.d.ts +604 -0
  37. package/dist/types.d.ts.map +1 -0
  38. package/dist/types.js +2 -0
  39. package/dist/types.js.map +1 -0
  40. package/package.json +36 -7
  41. package/src/actions.ts +1658 -0
  42. package/src/browser.test.ts +157 -0
  43. package/src/browser.ts +586 -0
  44. package/src/client.ts +150 -0
  45. package/src/daemon.ts +187 -0
  46. package/src/index.ts +984 -0
  47. package/src/protocol.test.ts +216 -0
  48. package/src/protocol.ts +848 -0
  49. package/src/types.ts +913 -0
  50. package/tsconfig.json +19 -0
  51. package/vitest.config.ts +9 -0
  52. package/index.js +0 -2
package/src/index.ts ADDED
@@ -0,0 +1,984 @@
1
+ #!/usr/bin/env node
2
+ import * as fs from 'fs';
3
+ import * as os from 'os';
4
+ import * as path from 'path';
5
+ import { send, setDebug, setSession, getSession } from './client.js';
6
+ import type { Response } from './types.js';
7
+
8
+ // ============================================================================
9
+ // Utilities
10
+ // ============================================================================
11
+
12
/**
 * Lists the names of sessions whose recorded process is still running.
 *
 * Scans the OS temp directory for `agent-browser-<name>.pid` files, reads the
 * PID stored in each, and probes it with signal 0 (an existence check that
 * delivers no signal). Files that cannot be read, do not hold a usable PID,
 * or point at a process that cannot be signalled are skipped.
 *
 * @returns The `<name>` part of every pid file whose process responded; an
 *   empty array when the temp directory itself cannot be read.
 */
function listSessions(): string[] {
  const tmpDir = os.tmpdir();

  let files: string[];
  try {
    files = fs.readdirSync(tmpDir);
  } catch {
    return [];
  }

  const sessions: string[] = [];
  for (const file of files) {
    const match = /^agent-browser-(.+)\.pid$/.exec(file);
    if (!match) continue;

    try {
      const raw = fs.readFileSync(path.join(tmpDir, file), 'utf8').trim();
      const pid = Number.parseInt(raw, 10);
      // A PID of 0 or below addresses a process group rather than a single
      // process, so probing it would "succeed" for a stale or corrupt file.
      if (!Number.isInteger(pid) || pid <= 0) continue;
      process.kill(pid, 0);
      sessions.push(match[1]);
    } catch {
      /* Unreadable pid file or process not running */
    }
  }
  return sessions;
}
35
+
36
/** ANSI escape sequences used to style terminal output. */
const colors = {
  reset: '\x1b[0m',
  bold: '\x1b[1m',
  dim: '\x1b[2m',
  red: '\x1b[31m',
  green: '\x1b[32m',
  yellow: '\x1b[33m',
  cyan: '\x1b[36m',
};

/**
 * Wraps `text` in the escape sequence for `color` and appends a reset.
 *
 * @param color - Key of the `colors` table.
 * @param text - Text to style.
 * @returns The styled string.
 */
function c(color: keyof typeof colors, text: string): string {
  const open = colors[color];
  return open + text + colors.reset;
}
47
+
48
/**
 * Produces a short pseudo-random identifier for a command.
 *
 * @returns Up to eight base-36 characters taken from `Math.random()`.
 */
function genId(): string {
  // toString(36) yields "0.<digits>"; keep the digits after the "0." prefix.
  const base36 = Math.random().toString(36);
  return base36.substring(2, 10);
}
51
+
52
/**
 * Reports a fatal usage error and terminates the process.
 *
 * Writes a red "Error:" label followed by `msg` to stderr, then exits with
 * status 1. Never returns.
 *
 * @param msg - Message shown after the label.
 */
function err(msg: string): never {
  const label = c('red', 'Error:');
  console.error(label, msg);
  process.exit(1);
}
56
+
57
+ // ============================================================================
58
+ // Help
59
+ // ============================================================================
60
+
61
/**
 * Prints the CLI usage summary to stdout.
 *
 * The text is a single template literal; descriptions are padded by hand so
 * they line up on the visible text (the colour escape codes add no width).
 */
function printHelp(): void {
  console.log(`
${c('bold', 'agent-browser')} - headless browser automation for AI agents

${c('yellow', 'Usage:')} agent-browser <command> [options]

${c('yellow', 'Core Commands:')}
  ${c('cyan', 'open')} <url>                Navigate to URL
  ${c('cyan', 'click')} <sel>               Click element
  ${c('cyan', 'type')} <sel> <text>         Type into element
  ${c('cyan', 'fill')} <sel> <text>         Clear and fill
  ${c('cyan', 'press')} <key>               Press key (Enter, Tab, Control+a)
  ${c('cyan', 'hover')} <sel>               Hover element
  ${c('cyan', 'select')} <sel> <val>        Select dropdown option
  ${c('cyan', 'scroll')} <dir> [px]         Scroll (up/down/left/right)
  ${c('cyan', 'wait')} <sel|ms>             Wait for element or time
  ${c('cyan', 'screenshot')} [path]         Take screenshot
  ${c('cyan', 'snapshot')}                  Accessibility tree (for AI)
  ${c('cyan', 'eval')} <js>                 Run JavaScript
  ${c('cyan', 'close')}                     Close browser

${c('yellow', 'Get Info:')} agent-browser get <what> [selector]
  text, html, value, attr, title, url, count, box

${c('yellow', 'Check State:')} agent-browser is <what> <selector>
  visible, enabled, checked

${c('yellow', 'Find Elements:')} agent-browser find <locator> <value> <action> [text]
  role, text, label, placeholder, alt, title, testid, first, last, nth

${c('yellow', 'Mouse:')} agent-browser mouse <action> [args]
  move <x> <y>, down, up, wheel <dy>

${c('yellow', 'Storage:')}
  ${c('cyan', 'cookies')} [get|set|clear]   Manage cookies
  ${c('cyan', 'storage')} <local|session>   Manage web storage

${c('yellow', 'Browser:')} agent-browser set <setting> [value]
  viewport, device, geo, offline, headers, credentials, media

${c('yellow', 'Network:')} agent-browser network <action>
  route, unroute, requests

${c('yellow', 'Tabs:')}
  ${c('cyan', 'tab')} [new|list|close|<n>]  Manage tabs

${c('yellow', 'Debug:')}
  ${c('cyan', 'trace')} start|stop <path>   Record trace
  ${c('cyan', 'console')}                   View console logs
  ${c('cyan', 'errors')}                    View page errors

${c('yellow', 'Options:')}
  --session <name>          Isolated session (or AGENT_BROWSER_SESSION env)
  --json                    JSON output
  --full, -f                Full page screenshot
  --headed                  Show browser window (not headless)
  --name, -n <name>         Accessible name filter for find role
  --exact                   Exact match for find locators
  --debug                   Debug output

${c('yellow', 'Examples:')}
  agent-browser open example.com
  agent-browser click "#submit"
  agent-browser fill "#email" "test@example.com"
  agent-browser get text "h1"
  agent-browser is visible ".modal"
  agent-browser find role button click --name Submit
  agent-browser wait 2000
  agent-browser wait --load networkidle
`);
}
130
+
131
+ // ============================================================================
132
+ // Response Printing
133
+ // ============================================================================
134
+
135
/**
 * Renders a daemon response for the terminal.
 *
 * In JSON mode the response is printed verbatim as one JSON line and the
 * function returns, whether or not the response succeeded. Otherwise a failed
 * response is written to stderr and the process exits with status 1, and a
 * successful response is formatted according to which fields its payload
 * carries.
 *
 * The branches are order-sensitive: the first matching shape wins, so shapes
 * that carry several recognisable fields must be tested before the generic
 * single-field fallbacks (`url`, `title`, `path`).
 *
 * @param response - Response received from the daemon.
 * @param jsonMode - When true, print raw JSON instead of formatted text.
 */
function printResponse(response: Response, jsonMode: boolean): void {
  if (jsonMode) {
    console.log(JSON.stringify(response));
    return;
  }

  if (!response.success) {
    console.error(c('red', '✗ Error:'), response.error);
    process.exit(1);
  }

  // A successful response without a payload is treated as an empty payload
  // instead of crashing on the first property access.
  const data = (response.data ?? {}) as Record<string, unknown>;
  const ok = c('green', '✓');
  const yesNo = (flag: unknown): string => (flag ? c('green', 'true') : c('red', 'false'));

  if (data.url && data.title) {
    console.log(ok, c('bold', data.title as string));
    console.log(c('dim', ` ${data.url}`));
  } else if (data.text !== undefined) {
    console.log(data.text ?? c('dim', 'null'));
  } else if (data.html !== undefined) {
    console.log(data.html);
  } else if (data.value !== undefined) {
    console.log(data.value ?? c('dim', 'null'));
  } else if (data.result !== undefined) {
    const result = data.result;
    console.log(typeof result === 'object' ? JSON.stringify(result, null, 2) : result);
  } else if (data.snapshot) {
    console.log(data.snapshot);
  } else if (data.visible !== undefined) {
    console.log(yesNo(data.visible));
  } else if (data.enabled !== undefined) {
    console.log(yesNo(data.enabled));
  } else if (data.checked !== undefined) {
    console.log(yesNo(data.checked));
  } else if (data.count !== undefined) {
    console.log(data.count);
  } else if (data.box) {
    const box = data.box as { x: number; y: number; width: number; height: number };
    console.log(`x:${box.x} y:${box.y} w:${box.width} h:${box.height}`);
  } else if (data.body !== undefined && data.status !== undefined) {
    // Response body. Must precede the bare `url` branch: this shape prints
    // `data.url`, so the generic branch would otherwise always pre-empt it.
    console.log(ok, `${data.status} ${data.url}`);
    console.log(typeof data.body === 'object' ? JSON.stringify(data.body, null, 2) : data.body);
  } else if (data.url) {
    console.log(data.url);
  } else if (data.title) {
    console.log(data.title);
  } else if (data.base64) {
    console.log(ok, 'Screenshot captured');
  } else if (data.filename) {
    // Download. Must precede the bare `path` branch: this shape prints
    // `data.path`, so the generic branch would otherwise always pre-empt it.
    console.log(ok, `Downloaded: ${data.filename}`);
    console.log(c('dim', ` Path: ${data.path}`));
  } else if (data.path) {
    console.log(ok, `Saved: ${data.path}`);
  } else if (data.cookies) {
    const cookies = data.cookies as Array<{ name: string; value: string }>;
    if (cookies.length === 0) console.log(c('dim', 'No cookies'));
    else cookies.forEach((ck) => console.log(`${c('cyan', ck.name)}: ${ck.value}`));
  } else if (data.tabs) {
    const tabs = data.tabs as Array<{ index: number; url: string; title: string; active: boolean }>;
    tabs.forEach((t) => {
      const marker = t.active ? c('green', '→') : ' ';
      console.log(`${marker} [${t.index}] ${t.title || c('dim', '(untitled)')}`);
      if (t.url) console.log(c('dim', ` ${t.url}`));
    });
  } else if (data.index !== undefined && data.total !== undefined) {
    console.log(ok, `Tab ${data.index} (${data.total} total)`);
  } else if (data.messages) {
    const msgs = data.messages as Array<{ type: string; text: string }>;
    if (msgs.length === 0) console.log(c('dim', 'No messages'));
    else
      msgs.forEach((m) => {
        const col = m.type === 'error' ? 'red' : m.type === 'warning' ? 'yellow' : 'dim';
        console.log(`${c(col, `[${m.type}]`)} ${m.text}`);
      });
  } else if (data.errors) {
    const errs = data.errors as Array<{ message: string }>;
    if (errs.length === 0) console.log(c('dim', 'No errors'));
    else errs.forEach((e) => console.log(c('red', '✗'), e.message));
  } else if (data.requests) {
    const reqs = data.requests as Array<{ method: string; url: string }>;
    if (reqs.length === 0) console.log(c('dim', 'No requests'));
    else reqs.forEach((r) => console.log(`${c('cyan', r.method)} ${r.url}`));
  } else if (data.moved) {
    console.log(ok, `Moved to (${data.x}, ${data.y})`);
  } else if (data.inserted) {
    console.log(ok, 'Text inserted');
  } else if (data.key) {
    console.log(ok, `Key ${data.down ? 'down' : 'up'}: ${data.key}`);
  } else if (data.note) {
    console.log(c('yellow', '⚠'), data.note);
  } else if (data.closed === true) {
    console.log(ok, 'Browser closed');
  } else if (data.launched) {
    console.log(ok, 'Browser launched');
  } else if (data.state) {
    console.log(ok, `Load state: ${data.state}`);
  } else if (
    Object.keys(data).some((k) =>
      [
        'clicked',
        'typed',
        'filled',
        'pressed',
        'hovered',
        'scrolled',
        'selected',
        'waited',
        'checked',
        'unchecked',
        'focused',
        'set',
        'cleared',
        'started',
        'down',
        'up',
      ].includes(k)
    )
  ) {
    // Plain acknowledgement of an action that has nothing else to report.
    console.log(ok, 'Done');
  } else {
    console.log(ok, JSON.stringify(data));
  }
}
259
+
260
+ // ============================================================================
261
+ // Command Handlers
262
+ // ============================================================================
263
+
264
/**
 * Builds the command for `agent-browser get <what> [selector]`.
 *
 * `title` and `url` need no selector; `attr` needs a selector and an
 * attribute name; every other option needs a selector. Invalid input is
 * reported through `err`, which terminates the process.
 *
 * @param args - Arguments after `get`: `[what, selector, attribute]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleGet(args: string[], id: string): Promise<Record<string, unknown>> {
  const [what, selector] = args;

  if (what === 'title' || what === 'url') {
    return { id, action: what };
  }

  if (what === 'attr') {
    const attribute = args[2];
    if (!selector || !attribute) err('Usage: agent-browser get attr <selector> <attribute>');
    return { id, action: 'getattribute', selector, attribute };
  }

  // Options that only need a selector, mapped to the action they request.
  const selectorActions = new Map<string, string>([
    ['text', 'gettext'],
    ['html', 'innerhtml'],
    ['value', 'inputvalue'],
    ['count', 'count'],
    ['box', 'boundingbox'],
  ]);

  const action = selectorActions.get(what);
  if (action === undefined) {
    err(`Unknown: agent-browser get ${what}. Options: text, html, value, attr, title, url, count, box`);
  }
  if (!selector) err(`Selector required: agent-browser get ${what} <selector>`);
  return { id, action, selector };
}
295
+
296
/**
 * Builds the command for `agent-browser is <what> <selector>`.
 *
 * The selector is validated first, then the state name. Invalid input is
 * reported through `err`, which terminates the process.
 *
 * @param args - Arguments after `is`: `[what, selector]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleIs(args: string[], id: string): Promise<Record<string, unknown>> {
  const [what, selector] = args;

  if (!selector) err(`Selector required: agent-browser is ${what} <selector>`);

  if (what === 'visible' || what === 'enabled' || what === 'checked') {
    // Action names are the state name prefixed with "is".
    return { id, action: `is${what}`, selector };
  }

  err(`Unknown: agent-browser is ${what}. Options: visible, enabled, checked`);
}
313
+
314
/**
 * Builds the command for `agent-browser find <locator> <value> <action> [text]`.
 *
 * For `nth` the positions shift by one: `find nth <index> <selector> <action> [text]`.
 * The action defaults to `click`. Invalid input is reported through `err`,
 * which terminates the process.
 *
 * @param args - Arguments after `find`.
 * @param id - Command id to attach to the message.
 * @param flags - Parsed flags; `name` and `exact` are forwarded to the locator.
 * @returns The command object to send.
 */
async function handleFind(
  args: string[],
  id: string,
  flags: Flags
): Promise<Record<string, unknown>> {
  const [locator, value] = args;

  if (!value) err(`Value required: agent-browser find ${locator} <value> <action>`);

  const subaction = args[2] || 'click';
  const fillValue = args[3];
  const { exact, name } = flags;

  // One builder per locator; only the selected one is evaluated.
  const builders = new Map<string, () => Record<string, unknown>>([
    [
      'role',
      () => ({ id, action: 'getbyrole', role: value, subaction, value: fillValue, name, exact }),
    ],
    ['text', () => ({ id, action: 'getbytext', text: value, subaction, exact })],
    [
      'label',
      () => ({ id, action: 'getbylabel', label: value, subaction, value: fillValue, exact }),
    ],
    [
      'placeholder',
      () => ({
        id,
        action: 'getbyplaceholder',
        placeholder: value,
        subaction,
        value: fillValue,
        exact,
      }),
    ],
    ['alt', () => ({ id, action: 'getbyalttext', text: value, subaction, exact })],
    ['title', () => ({ id, action: 'getbytitle', text: value, subaction, exact })],
    ['testid', () => ({ id, action: 'getbytestid', testId: value, subaction, value: fillValue })],
    ['first', () => ({ id, action: 'nth', selector: value, index: 0, subaction, value: fillValue })],
    ['last', () => ({ id, action: 'nth', selector: value, index: -1, subaction, value: fillValue })],
    [
      'nth',
      () => {
        // Here `value` is the index, and selector/action/text each move one slot right.
        const index = parseInt(value, 10);
        const selector = args[2];
        if (isNaN(index) || !selector) {
          err('Usage: agent-browser find nth <index> <selector> <action>');
        }
        return {
          id,
          action: 'nth',
          selector,
          index,
          subaction: args[3] || 'click',
          value: args[4],
        };
      },
    ],
  ]);

  const build = builders.get(locator);
  if (!build) {
    err(
      `Unknown locator: ${locator}. Options: role, text, label, placeholder, alt, title, testid, first, last, nth`
    );
  }
  return build();
}
369
+
370
/**
 * Builds the command for `agent-browser mouse <action> [args]`.
 *
 * - `move <x> <y>`: both coordinates are required integers.
 * - `down [button]` / `up [button]`: button defaults to `left`.
 * - `wheel [dy] [dx]`: a missing or non-numeric delta falls back to 100
 *   (vertical) or 0 (horizontal); an explicit `0` is kept, so
 *   `wheel 0 50` scrolls horizontally only.
 *
 * Invalid input is reported through `err`, which terminates the process.
 *
 * @param args - Arguments after `mouse`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleMouse(args: string[], id: string): Promise<Record<string, unknown>> {
  const action = args[0];

  switch (action) {
    case 'move': {
      const x = parseInt(args[1], 10);
      const y = parseInt(args[2], 10);
      if (isNaN(x) || isNaN(y)) err('Usage: agent-browser mouse move <x> <y>');
      return { id, action: 'mousemove', x, y };
    }
    case 'down':
      return { id, action: 'mousedown', button: args[1] || 'left' };
    case 'up':
      return { id, action: 'mouseup', button: args[1] || 'left' };
    case 'wheel': {
      const dy = parseInt(args[1], 10);
      const dx = parseInt(args[2], 10);
      // Only fall back when the argument is absent/unparseable; `|| 100`
      // would also replace a deliberate 0.
      return {
        id,
        action: 'wheel',
        deltaY: Number.isNaN(dy) ? 100 : dy,
        deltaX: Number.isNaN(dx) ? 0 : dx,
      };
    }
    default:
      err(`Unknown: agent-browser mouse ${action}. Options: move, down, up, wheel`);
  }
}
393
+
394
/**
 * Builds the command for `agent-browser set <setting> [value]`.
 *
 * Supported settings: `viewport`, `device`, `geo`/`geolocation`, `offline`,
 * `headers`, `credentials`/`auth`, `media`. Invalid input is reported through
 * `err`, which terminates the process.
 *
 * @param args - Arguments after `set`: `[setting, ...values]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleSet(args: string[], id: string): Promise<Record<string, unknown>> {
  const [setting, first, second] = args;

  if (setting === 'viewport') {
    const width = parseInt(first, 10);
    const height = parseInt(second, 10);
    if (isNaN(width) || isNaN(height)) err('Usage: agent-browser set viewport <width> <height>');
    return { id, action: 'viewport', width, height };
  }

  if (setting === 'device') {
    if (!first) err('Usage: agent-browser set device <name>');
    return { id, action: 'device', device: first };
  }

  if (setting === 'geo' || setting === 'geolocation') {
    const latitude = parseFloat(first);
    const longitude = parseFloat(second);
    if (isNaN(latitude) || isNaN(longitude)) err('Usage: agent-browser set geo <lat> <lng>');
    return { id, action: 'geolocation', latitude, longitude };
  }

  if (setting === 'offline') {
    // Offline unless the value is explicitly "off" or "false".
    const online = first === 'off' || first === 'false';
    return { id, action: 'offline', offline: !online };
  }

  if (setting === 'headers') {
    if (!first) err('Usage: agent-browser set headers <json>');
    let headers: unknown;
    try {
      headers = JSON.parse(first);
    } catch {
      err('Invalid JSON for headers');
    }
    return { id, action: 'headers', headers };
  }

  if (setting === 'credentials' || setting === 'auth') {
    if (!first || !second) err('Usage: agent-browser set credentials <user> <pass>');
    return { id, action: 'credentials', username: first, password: second };
  }

  if (setting === 'media') {
    // First of the two keywords present anywhere in the arguments, if any.
    const pick = (preferred: string, fallback: string): string | undefined => {
      if (args.includes(preferred)) return preferred;
      if (args.includes(fallback)) return fallback;
      return undefined;
    };
    const colorScheme = pick('dark', 'light');
    const media = pick('print', 'screen');
    return { id, action: 'emulatemedia', colorScheme, media };
  }

  err(
    `Unknown: agent-browser set ${setting}. Options: viewport, device, geo, offline, headers, credentials, media`
  );
  return {};
}
448
+
449
/**
 * Builds the command for `agent-browser network <action>`.
 *
 * Options (`--abort`, `--body`, `--clear`, `--filter`) are looked up in
 * `allArgs`, the unfiltered argument list, because they are not part of the
 * positional arguments. Invalid input is reported through `err`, which
 * terminates the process.
 *
 * @param args - Positional arguments after `network`: `[action, url]`.
 * @param id - Command id to attach to the message.
 * @param allArgs - Raw command-line arguments, including option tokens.
 * @returns The command object to send.
 */
async function handleNetwork(
  args: string[],
  id: string,
  allArgs: string[]
): Promise<Record<string, unknown>> {
  const [action, target] = args;

  // Token following `flag` in the raw arguments, when the flag is present.
  const optionValue = (flag: string): string | undefined => {
    const at = allArgs.indexOf(flag);
    return at === -1 ? undefined : allArgs[at + 1];
  };

  if (action === 'route') {
    if (!target) err('Usage: agent-browser network route <url> [--abort|--body <json>]');
    const abort = allArgs.includes('--abort');
    const body = optionValue('--body');
    const response = body ? { body, contentType: 'application/json' } : undefined;
    return { id, action: 'route', url: target, abort, response };
  }

  if (action === 'unroute') {
    return { id, action: 'unroute', url: target };
  }

  if (action === 'requests') {
    const clear = allArgs.includes('--clear');
    return { id, action: 'requests', clear, filter: optionValue('--filter') };
  }

  err(`Unknown: agent-browser network ${action}. Options: route, unroute, requests`);
  return {};
}
484
+
485
/**
 * Builds the command for `agent-browser storage <local|session> [get|set|clear] [key] [value]`.
 *
 * - `set <key> <value>`: the key must be non-empty; the value may be an empty
 *   string (storing `""` is valid) but must be present.
 * - `clear`: clears the chosen storage.
 * - anything else is a read, with the second argument passed as the key
 *   (it may be absent).
 *
 * Invalid input is reported through `err`, which terminates the process.
 *
 * @param args - Arguments after `storage`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleStorage(args: string[], id: string): Promise<Record<string, unknown>> {
  const [type, sub, key, value] = args;

  if (type !== 'local' && type !== 'session') {
    err('Usage: agent-browser storage <local|session> [get|set|clear] [key] [value]');
  }

  if (sub === 'set') {
    // Only a missing value is an error; `!value` would also reject "".
    if (!key || value === undefined) err(`Usage: agent-browser storage ${type} set <key> <value>`);
    return { id, action: 'storage_set', type, key, value };
  }

  if (sub === 'clear') {
    return { id, action: 'storage_clear', type };
  }

  // get (default)
  return { id, action: 'storage_get', type, key: sub };
}
503
+
504
/**
 * Builds the command for `agent-browser cookies [get|set|clear]`.
 *
 * `set` takes a JSON document as its argument; `clear` takes none; any other
 * (or no) subcommand reads the cookies. Invalid input is reported through
 * `err`, which terminates the process.
 *
 * @param args - Arguments after `cookies`: `[subcommand, json]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleCookies(args: string[], id: string): Promise<Record<string, unknown>> {
  const [sub, payload] = args;

  if (sub === 'clear') {
    return { id, action: 'cookies_clear' };
  }
  if (sub !== 'set') {
    return { id, action: 'cookies_get' };
  }

  if (!payload) err('Usage: agent-browser cookies set <json>');

  let cookies: unknown;
  try {
    cookies = JSON.parse(payload);
  } catch {
    err('Invalid JSON for cookies');
  }
  return { id, action: 'cookies_set', cookies };
}
521
+
522
/**
 * Builds the command for `agent-browser tab [new|list|close|<n>]`.
 *
 * - `new`: open a tab.
 * - `list`, `ls`, or no subcommand: list tabs.
 * - `close [n]`: close a tab; the index is optional but, when given, must be
 *   an integer.
 * - `<n>`: switch to the tab with that index.
 *
 * Invalid input is reported through `err`, which terminates the process.
 *
 * @param args - Arguments after `tab`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleTab(args: string[], id: string): Promise<Record<string, unknown>> {
  const sub = args[0];

  if (sub === 'new') {
    return { id, action: 'tab_new' };
  }

  if (sub === 'list' || sub === 'ls' || !sub) {
    return { id, action: 'tab_list' };
  }

  if (sub === 'close') {
    if (args[1] === undefined) {
      return { id, action: 'tab_close', index: undefined };
    }
    const idx = parseInt(args[1], 10);
    // NaN would be serialized as null, silently dropping what the user typed.
    if (isNaN(idx)) err('Usage: agent-browser tab close [index]');
    return { id, action: 'tab_close', index: idx };
  }

  const idx = parseInt(sub, 10);
  if (isNaN(idx)) err(`Unknown: agent-browser tab ${sub}. Options: new, list, close, <index>`);
  return { id, action: 'tab_switch', index: idx };
}
538
+
539
/**
 * Builds the command for `agent-browser trace start|stop <path>`.
 *
 * `start` requests a trace with screenshots and snapshots enabled; `stop`
 * requires the path to write to. Invalid input is reported through `err`,
 * which terminates the process.
 *
 * @param args - Arguments after `trace`: `[subcommand, path]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleTrace(args: string[], id: string): Promise<Record<string, unknown>> {
  const [sub, outFile] = args;

  switch (sub) {
    case 'start':
      return { id, action: 'trace_start', screenshots: true, snapshots: true };
    case 'stop':
      if (!outFile) err('Usage: agent-browser trace stop <path>');
      return { id, action: 'trace_stop', path: outFile };
    default:
      err('Usage: agent-browser trace start|stop');
  }
  return {};
}
552
+
553
/**
 * Builds the command for `agent-browser state save|load <path>`.
 *
 * Both subcommands require a path. Invalid input is reported through `err`,
 * which terminates the process.
 *
 * @param args - Arguments after `state`: `[subcommand, path]`.
 * @param id - Command id to attach to the message.
 * @returns The command object to send.
 */
async function handleState(args: string[], id: string): Promise<Record<string, unknown>> {
  // Named `file` rather than `path` to avoid shadowing the `path` module import.
  const [sub, file] = args;

  switch (sub) {
    case 'save':
      if (!file) err('Usage: agent-browser state save <path>');
      return { id, action: 'state_save', path: file };
    case 'load':
      if (!file) err('Usage: agent-browser state load <path>');
      return { id, action: 'state_load', path: file };
    default:
      err('Usage: agent-browser state save|load <path>');
  }
  return {};
}
568
+
569
+ // ============================================================================
570
+ // Flags Parser
571
+ // ============================================================================
572
+
573
/** Options recognised on the command line, after parsing. */
interface Flags {
  /** `--json`: print responses as raw JSON. */
  json: boolean;
  /** `--full` / `-f`: full-page screenshot. */
  full: boolean;
  /** `--text` / `-t`: treat the `wait` target as text. */
  text: boolean;
  /** `--debug`: enable client debug output. */
  debug: boolean;
  /** `--headed` / `--head`: launch the browser with a visible window. */
  headed: boolean;
  /** `--session <name>`; defaults to `AGENT_BROWSER_SESSION` or `default`. */
  session: string;
  /** `--selector` / `-s <sel>`: element scope for `scroll` and `screenshot`. */
  selector?: string;
  /** `--name` / `-n <name>`: name forwarded by `find role`. */
  name?: string;
  /** `--exact`: exact-match flag forwarded by `find`. */
  exact: boolean;
  /** `--url <pattern>`: makes `wait` wait for a URL. */
  url?: string;
  /** `--load <state>`: makes `wait` wait for a load state. */
  load?: string;
  /** `--fn` / `--function <expr>`: makes `wait` wait for a function. */
  fn?: string;
}

/** Flags that take no value, mapped to the `Flags` field they switch on. */
const BOOLEAN_FLAGS = new Map<string, 'json' | 'full' | 'text' | 'debug' | 'headed' | 'exact'>([
  ['--json', 'json'],
  ['--full', 'full'],
  ['-f', 'full'],
  ['--text', 'text'],
  ['-t', 'text'],
  ['--debug', 'debug'],
  ['--headed', 'headed'],
  ['--head', 'headed'],
  ['--exact', 'exact'],
]);

/** Flags that consume the following token, mapped to the field they set. */
const VALUE_FLAGS = new Map<string, 'session' | 'selector' | 'name' | 'url' | 'load' | 'fn'>([
  ['--session', 'session'],
  ['--selector', 'selector'],
  ['-s', 'selector'],
  ['--name', 'name'],
  ['-n', 'name'],
  ['--url', 'url'],
  ['--load', 'load'],
  ['--fn', 'fn'],
  ['--function', 'fn'],
]);

/** A dash-prefixed token that is a negative number rather than an option. */
const NEGATIVE_NUMBER = /^-(?:\d+\.?\d*|\.\d+)$/;

/**
 * Splits raw command-line arguments into recognised flags and positionals.
 *
 * - Boolean flags set their field to `true`.
 * - Value flags consume the next token; a value flag that is the last token
 *   (or is followed by an empty string) is ignored.
 * - Any other token starting with `-` is dropped from the positionals, except
 *   negative numbers such as `-100` or `-33.8`, which are kept so commands
 *   like `mouse wheel -100` and `set geo -33.8 151.2` receive them.
 *
 * @param args - Raw arguments, typically `process.argv.slice(2)`.
 * @returns The parsed `flags` and the remaining positional `cleanArgs`.
 */
function parseFlags(args: string[]): { flags: Flags; cleanArgs: string[] } {
  const flags: Flags = {
    json: false,
    full: false,
    text: false,
    debug: false,
    headed: false,
    session: process.env.AGENT_BROWSER_SESSION || 'default',
    exact: false,
  };
  const cleanArgs: string[] = [];

  for (let i = 0; i < args.length; i++) {
    const arg = args[i];

    const booleanField = BOOLEAN_FLAGS.get(arg);
    if (booleanField !== undefined) {
      flags[booleanField] = true;
      continue;
    }

    const valueField = VALUE_FLAGS.get(arg);
    if (valueField !== undefined && args[i + 1]) {
      flags[valueField] = args[++i];
      continue;
    }

    if (!arg.startsWith('-') || NEGATIVE_NUMBER.test(arg)) {
      cleanArgs.push(arg);
    }
    // Anything else is an unrecognised option (or a value flag without a
    // value) and is left out of the positionals.
  }

  return { flags, cleanArgs };
}
637
+
638
+ // ============================================================================
639
+ // Main
640
+ // ============================================================================
641
+
642
/** Commands that take no arguments, mapped to the action they request. */
const NO_ARG_ACTIONS = new Map<string, string>([
  ['snapshot', 'snapshot'],
  ['close', 'close'],
  ['quit', 'close'],
  ['exit', 'close'],
  ['back', 'back'],
  ['forward', 'forward'],
  ['reload', 'reload'],
  // Legacy aliases for backwards compatibility
  ['url', 'url'],
  ['title', 'title'],
]);

/** Commands whose single required argument is a selector. */
const SELECTOR_ACTIONS = new Map<string, string>([
  ['click', 'click'],
  ['dblclick', 'dblclick'],
  ['hover', 'hover'],
  ['focus', 'focus'],
  ['check', 'check'],
  ['uncheck', 'uncheck'],
  ['highlight', 'highlight'],
  ['scrollintoview', 'scrollintoview'],
  ['scrollinto', 'scrollintoview'],
]);

/** Commands whose single required argument is a key name. */
const KEY_ACTIONS = new Map<string, string>([
  ['press', 'press'],
  ['key', 'press'],
  ['keydown', 'keydown'],
  ['keyup', 'keyup'],
]);

/**
 * Adds `https://` to a bare host, leaving inputs that already name a scheme.
 *
 * A scheme is recognised as `<scheme>://` or one of the authority-less forms
 * `about:`, `data:`, `blob:`, `javascript:`, `view-source:`. A prefix test on
 * "http" is not enough: hosts such as `httpbin.org` start with it too.
 */
function normalizeUrl(input: string): string {
  const hasScheme =
    /^[a-z][a-z\d+.-]*:\/\//i.test(input) ||
    /^(?:about|data|blob|javascript|view-source):/i.test(input);
  return hasScheme ? input : `https://${input}`;
}

/** Handles `session [list|ls]` locally (no daemon round trip) and exits 0. */
function printSessionInfo(args: string[]): never {
  if (args[0] === 'list' || args[0] === 'ls') {
    const sessions = listSessions();
    const current = getSession();
    if (sessions.length === 0) {
      console.log(c('dim', 'No active sessions'));
    } else {
      sessions.forEach((s) => {
        const marker = s === current ? c('green', '→') : ' ';
        console.log(`${marker} ${c('cyan', s)}`);
      });
    }
  } else {
    console.log(c('cyan', getSession()));
  }
  process.exit(0);
}

/** Translates one CLI command into the command object sent to the daemon. */
async function buildCommand(
  command: string,
  args: string[],
  flags: Flags,
  rawArgs: string[],
  id: string
): Promise<Record<string, unknown>> {
  const noArgAction = NO_ARG_ACTIONS.get(command);
  if (noArgAction !== undefined) return { id, action: noArgAction };

  const selectorAction = SELECTOR_ACTIONS.get(command);
  if (selectorAction !== undefined) {
    if (!args[0]) err('Selector required');
    return { id, action: selectorAction, selector: args[0] };
  }

  const keyAction = KEY_ACTIONS.get(command);
  if (keyAction !== undefined) {
    if (!args[0]) err('Key required');
    return { id, action: keyAction, key: args[0] };
  }

  switch (command) {
    // === Core Commands ===
    case 'open':
    case 'goto':
    case 'navigate':
      if (!args[0]) err('URL required');
      return { id, action: 'navigate', url: normalizeUrl(args[0]) };

    case 'type':
      // The text may be empty, but it has to be present.
      if (!args[0] || args[1] === undefined) err('Usage: agent-browser type <selector> <text>');
      return { id, action: 'type', selector: args[0], text: args.slice(1).join(' ') };

    case 'fill':
      // An empty text is how a field is cleared, so only a missing one is an error.
      if (!args[0] || args[1] === undefined) err('Usage: agent-browser fill <selector> <text>');
      return { id, action: 'fill', selector: args[0], value: args.slice(1).join(' ') };

    case 'select':
      if (!args[0] || !args[1]) err('Usage: agent-browser select <selector> <value>');
      return { id, action: 'select', selector: args[0], value: args[1] };

    case 'drag':
      if (!args[0] || !args[1]) err('Usage: agent-browser drag <source> <target>');
      return { id, action: 'drag', source: args[0], target: args[1] };

    case 'upload':
      if (!args[0] || !args[1]) err('Usage: agent-browser upload <selector> <files...>');
      return { id, action: 'upload', selector: args[0], files: args.slice(1) };

    case 'scroll':
      return {
        id,
        action: 'scroll',
        direction: args[0] || 'down',
        amount: parseInt(args[1], 10) || 300,
        selector: flags.selector,
      };

    case 'wait': {
      const target = args[0];
      // Flags take precedence over the positional target.
      if (flags.fn) return { id, action: 'waitforfunction', expression: flags.fn };
      if (flags.url) return { id, action: 'waitforurl', url: flags.url };
      if (flags.load) return { id, action: 'waitforloadstate', state: flags.load };
      if (flags.text) {
        if (!target) err('Text required with --text flag');
        return { id, action: 'wait', text: target };
      }
      // An all-digit target is a duration in milliseconds, anything else a selector.
      if (target && /^\d+$/.test(target)) {
        return { id, action: 'wait', timeout: parseInt(target, 10) };
      }
      if (target) return { id, action: 'wait', selector: target };
      return err('Usage: agent-browser wait <selector|ms|--text|--url|--load|--fn>');
    }

    case 'screenshot':
      return {
        id,
        action: 'screenshot',
        path: args[0],
        fullPage: flags.full,
        selector: flags.selector,
      };

    case 'pdf':
      if (!args[0]) err('Path required');
      return { id, action: 'pdf', path: args[0] };

    case 'eval':
      if (!args[0]) err('Script required');
      return { id, action: 'evaluate', script: args.join(' ') };

    // === Grouped Commands ===
    case 'get':
      return handleGet(args, id);
    case 'is':
      return handleIs(args, id);
    case 'find':
      return handleFind(args, id, flags);
    case 'mouse':
      return handleMouse(args, id);
    case 'set':
      return handleSet(args, id);
    case 'network':
      return handleNetwork(args, id, rawArgs);
    case 'storage':
      return handleStorage(args, id);
    case 'cookies':
      return handleCookies(args, id);
    case 'tab':
      return handleTab(args, id);
    case 'trace':
      return handleTrace(args, id);
    case 'state':
      return handleState(args, id);

    case 'window':
      if (args[0] === 'new') return { id, action: 'window_new' };
      return err('Usage: agent-browser window new');

    case 'frame':
      if (!args[0]) err('Selector required');
      return args[0] === 'main'
        ? { id, action: 'mainframe' }
        : { id, action: 'frame', selector: args[0] };

    case 'dialog':
      if (args[0] === 'accept') {
        return { id, action: 'dialog', response: 'accept', promptText: args[1] };
      }
      if (args[0] === 'dismiss') {
        return { id, action: 'dialog', response: 'dismiss' };
      }
      return err('Usage: agent-browser dialog accept|dismiss');

    case 'console':
      return { id, action: 'console', clear: rawArgs.includes('--clear') };

    case 'errors':
      return { id, action: 'errors', clear: rawArgs.includes('--clear') };

    case 'initscript':
      if (!args[0]) err('Script required');
      return { id, action: 'addinitscript', script: args.join(' ') };

    case 'inserttext':
    case 'insert':
      if (!args[0]) err('Text required');
      return { id, action: 'inserttext', text: args.join(' ') };

    case 'multiselect':
      if (!args[0] || args.length < 2) {
        err('Usage: agent-browser multiselect <selector> <value1> [value2...]');
      }
      return { id, action: 'multiselect', selector: args[0], values: args.slice(1) };

    case 'download':
      return { id, action: 'waitfordownload', path: args[0] };

    case 'response':
      if (!args[0]) err('URL pattern required');
      return { id, action: 'responsebody', url: args[0] };

    // === Legacy aliases for backwards compatibility ===
    case 'gettext':
      return { id, action: 'gettext', selector: args[0] };
    case 'extract':
      return { id, action: 'content', selector: args[0] };

    default:
      console.error(c('red', 'Unknown command:'), command);
      console.error(c('dim', 'Run: agent-browser --help'));
      return process.exit(1);
  }
}

/**
 * CLI entry point: parses the arguments, builds the command, sends it to the
 * daemon and prints the response.
 *
 * Exit status: 0 when the response reports success (and for `--help` and
 * `session`); 1 for usage errors, unknown commands, transport failures and
 * failed responses. The status no longer depends on `--json`: a failed
 * response exits 1 in both output modes.
 */
async function main(): Promise<void> {
  const rawArgs = process.argv.slice(2);
  const { flags, cleanArgs } = parseFlags(rawArgs);

  if (flags.debug) setDebug(true);
  setSession(flags.session);

  if (cleanArgs.length === 0 || rawArgs.includes('--help') || rawArgs.includes('-h')) {
    printHelp();
    process.exit(0);
  }

  const [command, ...args] = cleanArgs;
  if (command === 'session') printSessionInfo(args);

  const id = genId();

  try {
    const cmd = await buildCommand(command, args, flags, rawArgs, id);

    // If --headed, launch with headless=false before navigating. This send is
    // inside the try so a failed launch is reported like any other failure.
    if (flags.headed && cmd.action === 'navigate') {
      await send({ id: genId(), action: 'launch', headless: false });
    }

    const response = await send(cmd);
    printResponse(response, flags.json);
    process.exit(response.success ? 0 : 1);
  } catch (error) {
    const message = error instanceof Error ? error.message : String(error);
    if (flags.json) {
      console.log(JSON.stringify({ id, success: false, error: message }));
    } else {
      console.error(c('red', '✗ Error:'), message);
    }
    process.exit(1);
  }
}
983
+
984
// Run the CLI. A rejection that escapes main() is reported and turned into a
// non-zero exit instead of surfacing as an unhandled promise rejection.
main().catch((error: unknown) => {
  console.error(c('red', '✗ Error:'), error instanceof Error ? error.message : String(error));
  process.exit(1);
});