@dyyz1993/agent-browser 0.24.0 → 0.26.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/agent-browser-darwin-arm64 +0 -0
- package/dist/__tests__/e2e/utils/test-helpers.d.ts +2 -2
- package/dist/__tests__/e2e/utils/test-helpers.d.ts.map +1 -1
- package/dist/__tests__/e2e/utils/test-helpers.js +6 -4
- package/dist/__tests__/e2e/utils/test-helpers.js.map +1 -1
- package/dist/actions/advanced.d.ts +73 -0
- package/dist/actions/advanced.d.ts.map +1 -0
- package/dist/actions/advanced.js +390 -0
- package/dist/actions/advanced.js.map +1 -0
- package/dist/actions/context.d.ts +36 -0
- package/dist/actions/context.d.ts.map +1 -0
- package/dist/actions/context.js +164 -0
- package/dist/actions/context.js.map +1 -0
- package/dist/actions/crawl.d.ts +8 -0
- package/dist/actions/crawl.d.ts.map +1 -0
- package/dist/actions/crawl.js +290 -0
- package/dist/actions/crawl.js.map +1 -0
- package/dist/actions/elements.d.ts +11 -0
- package/dist/actions/elements.d.ts.map +1 -0
- package/dist/actions/elements.js +78 -0
- package/dist/actions/elements.js.map +1 -0
- package/dist/actions/flow.d.ts +4 -0
- package/dist/actions/flow.d.ts.map +1 -0
- package/dist/actions/flow.js +170 -0
- package/dist/actions/flow.js.map +1 -0
- package/dist/actions/index.d.ts +7 -0
- package/dist/actions/index.d.ts.map +1 -0
- package/dist/actions/index.js +323 -0
- package/dist/actions/index.js.map +1 -0
- package/dist/actions/interact.d.ts +4 -0
- package/dist/actions/interact.d.ts.map +1 -0
- package/dist/actions/interact.js +162 -0
- package/dist/actions/interact.js.map +1 -0
- package/dist/actions/interaction.d.ts +31 -0
- package/dist/actions/interaction.d.ts.map +1 -0
- package/dist/actions/interaction.js +477 -0
- package/dist/actions/interaction.js.map +1 -0
- package/dist/actions/locators.d.ts +14 -0
- package/dist/actions/locators.d.ts.map +1 -0
- package/dist/actions/locators.js +310 -0
- package/dist/actions/locators.js.map +1 -0
- package/dist/actions/map.d.ts +4 -0
- package/dist/actions/map.d.ts.map +1 -0
- package/dist/actions/map.js +79 -0
- package/dist/actions/map.js.map +1 -0
- package/dist/actions/meta.d.ts +44 -0
- package/dist/actions/meta.d.ts.map +1 -0
- package/dist/actions/meta.js +190 -0
- package/dist/actions/meta.js.map +1 -0
- package/dist/actions/mouse.d.ts +8 -0
- package/dist/actions/mouse.d.ts.map +1 -0
- package/dist/actions/mouse.js +52 -0
- package/dist/actions/mouse.js.map +1 -0
- package/dist/actions/recorder.d.ts +20 -0
- package/dist/actions/recorder.d.ts.map +1 -0
- package/dist/actions/recorder.js +231 -0
- package/dist/actions/recorder.js.map +1 -0
- package/dist/actions/recording.d.ts +6 -0
- package/dist/actions/recording.d.ts.map +1 -0
- package/dist/actions/recording.js +22 -0
- package/dist/actions/recording.js.map +1 -0
- package/dist/actions/scrape.d.ts +10 -0
- package/dist/actions/scrape.d.ts.map +1 -0
- package/dist/actions/scrape.js +39 -0
- package/dist/actions/scrape.js.map +1 -0
- package/dist/actions/screencast.d.ts +8 -0
- package/dist/actions/screencast.d.ts.map +1 -0
- package/dist/actions/screencast.js +56 -0
- package/dist/actions/screencast.js.map +1 -0
- package/dist/actions/search.d.ts +4 -0
- package/dist/actions/search.d.ts.map +1 -0
- package/dist/actions/search.js +129 -0
- package/dist/actions/search.js.map +1 -0
- package/dist/actions/storage.d.ts +14 -0
- package/dist/actions/storage.d.ts.map +1 -0
- package/dist/actions/storage.js +63 -0
- package/dist/actions/storage.js.map +1 -0
- package/dist/actions/tabs.d.ts +16 -0
- package/dist/actions/tabs.d.ts.map +1 -0
- package/dist/actions/tabs.js +47 -0
- package/dist/actions/tabs.js.map +1 -0
- package/dist/actions/utils.d.ts +15 -0
- package/dist/actions/utils.d.ts.map +1 -0
- package/dist/actions/utils.js +234 -0
- package/dist/actions/utils.js.map +1 -0
- package/dist/browser/browser-manager.d.ts +249 -0
- package/dist/browser/browser-manager.d.ts.map +1 -0
- package/dist/browser/browser-manager.js +1251 -0
- package/dist/browser/browser-manager.js.map +1 -0
- package/dist/browser/index.d.ts +3 -0
- package/dist/browser/index.d.ts.map +1 -0
- package/dist/browser/index.js +2 -0
- package/dist/browser/index.js.map +1 -0
- package/dist/browser/network-tracker.d.ts +39 -0
- package/dist/browser/network-tracker.d.ts.map +1 -0
- package/dist/browser/network-tracker.js +287 -0
- package/dist/browser/network-tracker.js.map +1 -0
- package/dist/browser/providers.d.ts +27 -0
- package/dist/browser/providers.d.ts.map +1 -0
- package/dist/browser/providers.js +293 -0
- package/dist/browser/providers.js.map +1 -0
- package/dist/browser/recorder-manager.d.ts +69 -0
- package/dist/browser/recorder-manager.d.ts.map +1 -0
- package/dist/browser/recorder-manager.js +755 -0
- package/dist/browser/recorder-manager.js.map +1 -0
- package/dist/browser/recording-manager.d.ts +46 -0
- package/dist/browser/recording-manager.d.ts.map +1 -0
- package/dist/browser/recording-manager.js +156 -0
- package/dist/browser/recording-manager.js.map +1 -0
- package/dist/browser/screencast-manager.d.ts +49 -0
- package/dist/browser/screencast-manager.d.ts.map +1 -0
- package/dist/browser/screencast-manager.js +131 -0
- package/dist/browser/screencast-manager.js.map +1 -0
- package/dist/browser/types.d.ts +101 -0
- package/dist/browser/types.d.ts.map +1 -0
- package/dist/browser/types.js +2 -0
- package/dist/browser/types.js.map +1 -0
- package/dist/browser-events.d.ts +25 -0
- package/dist/browser-events.d.ts.map +1 -0
- package/dist/browser-events.js +15 -0
- package/dist/browser-events.js.map +1 -0
- package/dist/cli/commands.d.ts.map +1 -1
- package/dist/cli/commands.js +145 -1
- package/dist/cli/commands.js.map +1 -1
- package/dist/cli/connection.d.ts.map +1 -1
- package/dist/cli/connection.js +15 -22
- package/dist/cli/connection.js.map +1 -1
- package/dist/cli/flags.d.ts +1 -0
- package/dist/cli/flags.d.ts.map +1 -1
- package/dist/cli/flags.js +8 -0
- package/dist/cli/flags.js.map +1 -1
- package/dist/cli/help.d.ts.map +1 -1
- package/dist/cli/help.js +204 -4
- package/dist/cli/help.js.map +1 -1
- package/dist/cli/output.d.ts.map +1 -1
- package/dist/cli/output.js +72 -0
- package/dist/cli/output.js.map +1 -1
- package/dist/cli.js +149 -14
- package/dist/cli.js.map +1 -1
- package/dist/daemon.d.ts +1 -1
- package/dist/daemon.d.ts.map +1 -1
- package/dist/daemon.js +12 -13
- package/dist/daemon.js.map +1 -1
- package/dist/flow/exporters/playwright.d.ts +23 -1
- package/dist/flow/exporters/playwright.d.ts.map +1 -1
- package/dist/flow/exporters/playwright.js +333 -85
- package/dist/flow/exporters/playwright.js.map +1 -1
- package/dist/flow/exporters/python.d.ts +22 -0
- package/dist/flow/exporters/python.d.ts.map +1 -1
- package/dist/flow/exporters/python.js +325 -74
- package/dist/flow/exporters/python.js.map +1 -1
- package/dist/flow/exporters/selenium.d.ts.map +1 -1
- package/dist/flow/exporters/selenium.js +0 -1
- package/dist/flow/exporters/selenium.js.map +1 -1
- package/dist/flow/flow-executor.d.ts +1 -1
- package/dist/flow/flow-executor.d.ts.map +1 -1
- package/dist/flow/flow-executor.js +11 -11
- package/dist/flow/flow-executor.js.map +1 -1
- package/dist/flow/output.js.map +1 -1
- package/dist/flow/plugin-system.d.ts +1 -1
- package/dist/flow/plugin-system.d.ts.map +1 -1
- package/dist/flow/plugin-system.js +2 -2
- package/dist/flow/plugin-system.js.map +1 -1
- package/dist/flow/plugins/logging-plugin.js +1 -1
- package/dist/flow/plugins/logging-plugin.js.map +1 -1
- package/dist/flow/presets/console-capture.js +50 -0
- package/dist/flow/presets/fetch-capture.js +107 -0
- package/dist/flow/presets/sse-stream.js +85 -0
- package/dist/flow/presets/xhr-only.js +44 -0
- package/dist/flow/recorder-to-flow.d.ts.map +1 -1
- package/dist/flow/recorder-to-flow.js +1 -3
- package/dist/flow/recorder-to-flow.js.map +1 -1
- package/dist/flow/site-manager.d.ts.map +1 -1
- package/dist/flow/site-manager.js +6 -2
- package/dist/flow/site-manager.js.map +1 -1
- package/dist/human-mouse.d.ts +1 -1
- package/dist/human-mouse.d.ts.map +1 -1
- package/dist/human-mouse.js +2 -2
- package/dist/human-mouse.js.map +1 -1
- package/dist/protocol.d.ts.map +1 -1
- package/dist/protocol.js +91 -1
- package/dist/protocol.js.map +1 -1
- package/dist/rc-config.js +4 -4
- package/dist/rc-config.js.map +1 -1
- package/dist/recorder/inject.js +31 -5
- package/dist/snapshot.d.ts.map +1 -1
- package/dist/snapshot.js +3 -4
- package/dist/snapshot.js.map +1 -1
- package/dist/stream-server-standalone.d.ts +1 -1
- package/dist/stream-server-standalone.d.ts.map +1 -1
- package/dist/stream-server-standalone.js +42 -23
- package/dist/stream-server-standalone.js.map +1 -1
- package/dist/stream-server.d.ts +1 -1
- package/dist/stream-server.d.ts.map +1 -1
- package/dist/stream-server.js +26 -21
- package/dist/stream-server.js.map +1 -1
- package/dist/test-live.js +9 -3
- package/dist/test-live.js.map +1 -1
- package/dist/types.d.ts +123 -2
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js.map +1 -1
- package/package.json +4 -3
- package/scripts/README.md +66 -0
- package/scripts/check_goods_container.js +35 -0
- package/scripts/check_page_content.js +36 -0
- package/scripts/click_applause_rate.js +30 -0
- package/scripts/copy-flow-presets.js +25 -0
- package/scripts/douyin-flow-test.sh +72 -0
- package/scripts/douyin-test.sh +101 -0
- package/scripts/explore_jd_page.js +31 -0
- package/scripts/extract_all_jd_data.js +80 -0
- package/scripts/extract_jd_product_detail.js +62 -0
- package/scripts/extract_jd_products_correct_links.js +78 -0
- package/scripts/extract_jd_products_final.js +80 -0
- package/scripts/extract_jd_reviews.js +48 -0
- package/scripts/extract_jd_seafood_final.js +78 -0
- package/scripts/extract_multiple_products.js +77 -0
- package/scripts/extract_products_no_scroll.js +68 -0
- package/scripts/extract_products_simple.js +68 -0
- package/scripts/find_applause_rate.js +26 -0
- package/scripts/find_jd_links.js +28 -0
- package/scripts/find_main_content.js +20 -0
- package/scripts/find_product_cards.js +38 -0
- package/scripts/find_root_content.js +26 -0
- package/scripts/find_unique_products.js +55 -0
- package/scripts/get_jd_product_detail.js +16 -0
- package/scripts/get_jd_products.js +23 -0
- package/scripts/get_jd_seafood_products.js +44 -0
- package/scripts/get_product_details_from_images.js +54 -0
- package/scripts/verify-form.sh +67 -0
- package/scripts/verify-login.sh +65 -0
- package/scripts/verify-recording.sh +80 -0
- package/scripts/verify-upload.sh +41 -0
- package/bin/agent-browser-darwin-x64 +0 -0
- package/bin/agent-browser-linux-arm64 +0 -0
- package/bin/agent-browser-linux-x64 +0 -0
- package/bin/agent-browser-win32-x64.exe +0 -0
- package/dist/actions.d.ts +0 -51
- package/dist/actions.d.ts.map +0 -1
- package/dist/actions.js +0 -2662
- package/dist/actions.js.map +0 -1
- package/dist/browser.d.ts +0 -651
- package/dist/browser.d.ts.map +0 -1
- package/dist/browser.js +0 -3088
- package/dist/browser.js.map +0 -1
|
@@ -0,0 +1,164 @@
|
|
|
1
|
+
import { successResponse } from '../protocol.js';
|
|
2
|
+
/**
 * Configures how the browser answers dialogs.
 *
 * Forwards `command.response` and `command.promptText` to
 * `browser.setDialogHandler` and acknowledges with the chosen response.
 *
 * @param {object} command - Carries `id`, `response` and optional `promptText`.
 * @param {object} browser - Browser manager exposing `setDialogHandler`.
 * @returns {Promise<object>} Success response `{ handler: 'set', response }`.
 */
export async function handleDialog(command, browser) {
  const { response, promptText } = command;
  browser.setDialogHandler(response, promptText);
  const payload = { handler: 'set', response };
  return successResponse(command.id, payload);
}
|
|
6
|
+
/**
 * Renders the current page to a PDF file.
 *
 * @param {object} command - Carries `id`, `path` and optional `format`
 *   (falls back to 'Letter' when null/undefined).
 * @param {object} browser - Browser manager exposing `getPage`.
 * @returns {Promise<object>} Success response containing the output `path`.
 */
export async function handlePdf(command, browser) {
  const pdfOptions = {
    path: command.path,
    format: command.format ?? 'Letter',
  };
  const activePage = browser.getPage();
  await activePage.pdf(pdfOptions);
  return successResponse(command.id, { path: command.path });
}
|
|
14
|
+
/**
 * Installs a route for `command.url`, passing the optional mocked
 * `response` and `abort` flag through to `browser.addRoute`.
 *
 * @param {object} command - Carries `id`, `url`, `response`, `abort`.
 * @param {object} browser - Browser manager exposing `addRoute`.
 * @returns {Promise<object>} Success response `{ routed: url }`.
 */
export async function handleRoute(command, browser) {
  const { url, response, abort } = command;
  await browser.addRoute(url, { response, abort });
  return successResponse(command.id, { routed: url });
}
|
|
21
|
+
/**
 * Removes a previously installed route.
 *
 * @param {object} command - Carries `id` and an optional `url`; when `url`
 *   is null/undefined the response reports 'all'.
 * @param {object} browser - Browser manager exposing `removeRoute`.
 * @returns {Promise<object>} Success response `{ unrouted }`.
 */
export async function handleUnroute(command, browser) {
  const { url } = command;
  await browser.removeRoute(url);
  const unrouted = url ?? 'all';
  return successResponse(command.id, { unrouted });
}
|
|
25
|
+
/**
 * Lists, saves, or clears tracked network requests.
 *
 * - `command.clear`: clears the tracked requests and returns immediately.
 * - `command.output`: saves the (filtered) requests via
 *   `browser.saveRequestsToDir` and reports where they were written.
 * - otherwise: returns the (filtered) requests, plus a hint when tracking
 *   was not enabled before this call and nothing has been captured.
 *
 * Tracking is started on every non-clear call.
 *
 * @param {object} command - Carries `id`, `clear`, `captureResponse`,
 *   `output`, `filter`, `type`.
 * @param {object} browser - Browser manager with the request-tracking API.
 * @returns {Promise<object>} Success response for the selected mode.
 */
export async function handleRequests(command, browser) {
  const { id, filter, type } = command;

  if (command.clear) {
    browser.clearRequests();
    return successResponse(id, { cleared: true });
  }

  // Read the flag before starting tracking so the hint below is accurate.
  const trackingWasOn = browser.trackingEnabled;
  browser.startRequestTracking(command.captureResponse);

  if (command.output) {
    const saved = browser.saveRequestsToDir(command.output, filter, type);
    return successResponse(id, {
      saved: true,
      savedCount: saved.savedCount,
      outputPath: saved.outputPath,
      indexPath: saved.indexPath,
    });
  }

  const requests = browser.getRequests(filter, type);
  const nothingCapturedYet = requests.length === 0 && !trackingWasOn;
  const payload = nothingCapturedYet
    ? {
        requests,
        hint: 'Request tracking just activated. Reload or navigate to capture requests.',
      }
    : { requests };
  return successResponse(id, payload);
}
|
|
48
|
+
/**
 * Lists or clears tracked WebSocket connections.
 *
 * With `command.clear` the tracked sockets are cleared. Otherwise tracking
 * is started and the (filtered) sockets are returned, plus a hint when
 * tracking was not enabled before this call and nothing has been captured.
 *
 * @param {object} command - Carries `id`, `clear`, `filter`.
 * @param {object} browser - Browser manager with the WebSocket-tracking API.
 * @returns {Promise<object>} Success response `{ websockets, hint? }` or
 *   `{ cleared: true }`.
 */
export async function handleWebSockets(command, browser) {
  if (command.clear) {
    browser.clearWebSockets();
    return successResponse(command.id, { cleared: true });
  }

  // Read the flag before starting tracking so the hint below is accurate.
  const trackingWasOn = browser.wsTrackingEnabled;
  browser.startWebSocketTracking();

  const websockets = browser.getWebSockets(command.filter);
  const nothingCapturedYet = websockets.length === 0 && !trackingWasOn;
  const payload = nothingCapturedYet
    ? {
        websockets,
        hint: 'WebSocket tracking just activated. Reload or navigate to capture connections.',
      }
    : { websockets };
  return successResponse(command.id, payload);
}
|
|
62
|
+
/**
 * Clicks the element at `command.selector` and saves the resulting download
 * to `command.path`.
 *
 * @param {object} command - Carries `id`, `selector`, optional `inFrame`,
 *   and the destination `path`.
 * @param {object} browser - Browser manager exposing `getPage` and
 *   `getLocator`.
 * @returns {Promise<object>} Success response with `path` and the
 *   download's `suggestedFilename`.
 */
export async function handleDownload(command, browser) {
  const activePage = browser.getPage();
  const trigger = browser.getLocator(command.selector, command.inFrame);

  // Start listening before clicking so the download event is not missed.
  const downloadEvent = activePage.waitForEvent('download');
  const click = trigger.click();
  const [download] = await Promise.all([downloadEvent, click]);

  await download.saveAs(command.path);
  const suggestedFilename = download.suggestedFilename();
  return successResponse(command.id, { path: command.path, suggestedFilename });
}
|
|
72
|
+
/**
 * Sets the emulated geolocation.
 *
 * @param {object} command - Carries `id`, `latitude`, `longitude` and
 *   optional `accuracy` (forwarded but not echoed in the response).
 * @param {object} browser - Browser manager exposing `setGeolocation`.
 * @returns {Promise<object>} Success response `{ latitude, longitude }`.
 */
export async function handleGeolocation(command, browser) {
  const { latitude, longitude, accuracy } = command;
  await browser.setGeolocation(latitude, longitude, accuracy);
  return successResponse(command.id, { latitude, longitude });
}
|
|
79
|
+
/**
 * Applies browser permissions.
 *
 * @param {object} command - Carries `id`, `permissions` and `grant`; both
 *   are forwarded to `browser.setPermissions`.
 * @param {object} browser - Browser manager exposing `setPermissions`.
 * @returns {Promise<object>} Success response `{ permissions, granted }`.
 */
export async function handlePermissions(command, browser) {
  const { permissions, grant } = command;
  await browser.setPermissions(permissions, grant);
  return successResponse(command.id, { permissions, granted: grant });
}
|
|
86
|
+
/**
 * Resizes the viewport.
 *
 * @param {object} command - Carries `id`, `width`, `height`.
 * @param {object} browser - Browser manager exposing `setViewport`.
 * @returns {Promise<object>} Success response `{ width, height }`.
 */
export async function handleViewport(command, browser) {
  const { width, height } = command;
  await browser.setViewport(width, height);
  return successResponse(command.id, { width, height });
}
|
|
93
|
+
/**
 * Responds to a user-agent command without touching the browser: the
 * response only carries a note pointing the caller at the device command.
 *
 * @param {object} command - Carries `id`.
 * @param {object} _browser - Unused.
 * @returns {Promise<object>} Success response `{ note }`.
 */
export async function handleUserAgent(command, _browser) {
  const note = 'User agent can only be set at launch time. Use device command instead.';
  return successResponse(command.id, { note });
}
|
|
98
|
+
/**
 * Emulates a named device.
 *
 * Looks the device up via `browser.getDevice`, applies its viewport, and
 * then either sets a device-scale-factor override (when the factor is truthy
 * and not 1) or clears any existing metrics override.
 *
 * @param {object} command - Carries `id` and the `device` name.
 * @param {object} browser - Browser manager with the device/viewport API.
 * @returns {Promise<object>} Success response with `device`, `viewport`,
 *   `userAgent` and `deviceScaleFactor` from the device descriptor.
 * @throws {Error} When the device name is unknown; the message lists up to
 *   ten available device names.
 */
export async function handleDevice(command, browser) {
  const descriptor = browser.getDevice(command.device);
  if (!descriptor) {
    const sample = browser.listDevices().slice(0, 10).join(', ');
    throw new Error(`Unknown device: ${command.device}. Available: ${sample}...`);
  }

  const { width, height } = descriptor.viewport;
  await browser.setViewport(width, height);

  const scale = descriptor.deviceScaleFactor;
  const needsScaleOverride = Boolean(scale) && scale !== 1;
  if (needsScaleOverride) {
    await browser.setDeviceScaleFactor(scale, width, height, descriptor.isMobile ?? false);
  } else {
    try {
      await browser.clearDeviceMetricsOverride();
    } catch {
      // Ignore error if override was never set
    }
  }

  return successResponse(command.id, {
    device: command.device,
    viewport: descriptor.viewport,
    userAgent: descriptor.userAgent,
    deviceScaleFactor: descriptor.deviceScaleFactor,
  });
}
|
|
123
|
+
/**
 * Navigates one entry back in history.
 *
 * The 'back' step is recorded before the navigation is attempted.
 *
 * @param {object} command - Carries `id`.
 * @param {object} browser - Browser manager exposing `recordStep`/`getPage`.
 * @returns {Promise<object>} Success response with the page `url` after
 *   navigating.
 */
export async function handleBack(command, browser) {
  browser.recordStep({ action: 'back' });
  const activePage = browser.getPage();
  await activePage.goBack();
  const url = activePage.url();
  return successResponse(command.id, { url });
}
|
|
129
|
+
/**
 * Navigates one entry forward in history.
 *
 * The 'forward' step is recorded before the navigation is attempted.
 *
 * @param {object} command - Carries `id`.
 * @param {object} browser - Browser manager exposing `recordStep`/`getPage`.
 * @returns {Promise<object>} Success response with the page `url` after
 *   navigating.
 */
export async function handleForward(command, browser) {
  browser.recordStep({ action: 'forward' });
  const activePage = browser.getPage();
  await activePage.goForward();
  const url = activePage.url();
  return successResponse(command.id, { url });
}
|
|
135
|
+
/**
 * Reloads the current page.
 *
 * The 'reload' step is recorded before the reload is attempted.
 *
 * @param {object} command - Carries `id`.
 * @param {object} browser - Browser manager exposing `recordStep`/`getPage`.
 * @returns {Promise<object>} Success response with the page `url` after
 *   reloading.
 */
export async function handleReload(command, browser) {
  browser.recordStep({ action: 'reload' });
  const activePage = browser.getPage();
  await activePage.reload();
  const url = activePage.url();
  return successResponse(command.id, { url });
}
|
|
141
|
+
/**
 * Reports the current URL of the page, or of a frame when
 * `command.inFrame` is set.
 *
 * @param {object} command - Carries `id` and optional `inFrame`.
 * @param {object} browser - Browser manager exposing `getPage`/`getFrame`.
 * @returns {Promise<object>} Success response `{ url }`.
 */
export async function handleUrl(command, browser) {
  if (!command.inFrame) {
    const activePage = browser.getPage();
    return successResponse(command.id, { url: activePage.url() });
  }

  // Inside a frame the URL is read from the frame's own document.
  const frameRoot = browser.getFrame(command.inFrame).locator(':root');
  const url = await frameRoot.evaluate(() => window.location.href);
  return successResponse(command.id, { url });
}
|
|
152
|
+
/**
 * Reports the document title of the page, or of a frame when
 * `command.inFrame` is set.
 *
 * @param {object} command - Carries `id` and optional `inFrame`.
 * @param {object} browser - Browser manager exposing `getPage`/`getFrame`.
 * @returns {Promise<object>} Success response `{ title }`.
 */
export async function handleTitle(command, browser) {
  let title;
  if (command.inFrame) {
    // Inside a frame the title is read from the frame's own document.
    const frameRoot = browser.getFrame(command.inFrame).locator(':root');
    title = await frameRoot.evaluate(() => document.title);
  } else {
    title = await browser.getPage().title();
  }
  return successResponse(command.id, { title });
}
|
|
164
|
+
//# sourceMappingURL=context.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"context.js","sourceRoot":"","sources":["../../src/actions/context.ts"],"names":[],"mappings":"AAeA,OAAO,EAAE,eAAe,EAAE,MAAM,gBAAgB,CAAC;AAEjD,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,OAAsB,EACtB,OAAuB;IAEvB,OAAO,CAAC,gBAAgB,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;IAC/D,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,KAAK,EAAE,QAAQ,EAAE,OAAO,CAAC,QAAQ,EAAE,CAAC,CAAC;AACrF,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,SAAS,CAAC,OAAmB,EAAE,OAAuB;IAC1E,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,MAAM,IAAI,CAAC,GAAG,CAAC;QACb,IAAI,EAAE,OAAO,CAAC,IAAI;QAClB,MAAM,EAAE,OAAO,CAAC,MAAM,IAAI,QAAQ;KACnC,CAAC,CAAC;IACH,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,IAAI,EAAE,OAAO,CAAC,IAAI,EAAE,CAAC,CAAC;AAC7D,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,WAAW,CAC/B,OAAqB,EACrB,OAAuB;IAEvB,MAAM,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,GAAG,EAAE;QAClC,QAAQ,EAAE,OAAO,CAAC,QAAQ;QAC1B,KAAK,EAAE,OAAO,CAAC,KAAK;KACrB,CAAC,CAAC;IACH,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,MAAM,EAAE,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;AAC9D,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,aAAa,CACjC,OAAsD,EACtD,OAAuB;IAEvB,MAAM,OAAO,CAAC,WAAW,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;IACvC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,QAAQ,EAAE,OAAO,CAAC,GAAG,IAAI,KAAK,EAAE,CAAC,CAAC;AACzE,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,cAAc,CAClC,OAAwB,EACxB,OAAuB;IAEvB,IAAI,OAAO,CAAC,KAAK,EAAE,CAAC;QAClB,OAAO,CAAC,aAAa,EAAE,CAAC;QACxB,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;IACxD,CAAC;IAED,MAAM,WAAW,GAAG,OAAO,CAAC,eAAe,CAAC;IAC5C,OAAO,CAAC,oBAAoB,CAAC,OAAO,CAAC,eAAe,CAAC,CAAC;IAEtD,IAAI,OAAO,CAAC,MAAM,EAAE,CAAC;QACnB,MAAM,MAAM,GAAG,OAAO,CAAC,iBAAiB,CAAC,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;QACvF,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;YACjC,KAAK,EAAE,IAAI;YACX,UAAU,EAAE,MAAM,CAAC,UAAU;YAC7B,UAAU,EAAE,MAAM,CAAC,UAAU;YAC7B,SAAS,EAAE,MAAM,CAAC,SAAS;SAC5B,CAAC,CAAC;IACL,CAAC;IAED,MAAM,QAAQ,GAAG,OAAO,CAAC,WAAW,CAAC,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;IACnE,MAAM,MAAM,GAA4B,EAAE,QAAQ,EAAE,CAAC;IACrD,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC,IA
AI,CAAC,WAAW,EAAE,CAAC;QAC1C,MAAM,CAAC,IAAI,GAAG,0EAA0E,CAAC;IAC3F,CAAC;IACD,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,MAAM,CAAC,CAAC;AAC7C,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,gBAAgB,CACpC,OAA0B,EAC1B,OAAuB;IAEvB,IAAI,OAAO,CAAC,KAAK,EAAE,CAAC;QAClB,OAAO,CAAC,eAAe,EAAE,CAAC;QAC1B,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;IACxD,CAAC;IAED,MAAM,WAAW,GAAG,OAAO,CAAC,iBAAiB,CAAC;IAC9C,OAAO,CAAC,sBAAsB,EAAE,CAAC;IAEjC,MAAM,OAAO,GAAG,OAAO,CAAC,aAAa,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;IACtD,MAAM,MAAM,GAA4B,EAAE,UAAU,EAAE,OAAO,EAAE,CAAC;IAChE,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,IAAI,CAAC,WAAW,EAAE,CAAC;QACzC,MAAM,CAAC,IAAI,GAAG,+EAA+E,CAAC;IAChG,CAAC;IACD,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,MAAM,CAAC,CAAC;AAC7C,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,cAAc,CAClC,OAAwB,EACxB,OAAuB;IAEvB,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IAEtE,MAAM,CAAC,QAAQ,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,YAAY,CAAC,UAAU,CAAC,EAAE,OAAO,CAAC,KAAK,EAAE,CAAC,CAAC,CAAC;IAEvF,MAAM,QAAQ,CAAC,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;IACpC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,IAAI,EAAE,OAAO,CAAC,IAAI;QAClB,iBAAiB,EAAE,QAAQ,CAAC,iBAAiB,EAAE;KAChD,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,iBAAiB,CACrC,OAA2B,EAC3B,OAAuB;IAEvB,MAAM,OAAO,CAAC,cAAc,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,SAAS,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IACpF,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,QAAQ,EAAE,OAAO,CAAC,QAAQ;QAC1B,SAAS,EAAE,OAAO,CAAC,SAAS;KAC7B,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,iBAAiB,CACrC,OAA2B,EAC3B,OAAuB;IAEvB,MAAM,OAAO,CAAC,cAAc,CAAC,OAAO,CAAC,WAAW,EAAE,OAAO,CAAC,KAAK,CAAC,CAAC;IACjE,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,WAAW,EAAE,OAAO,CAAC,WAAW;QAChC,OAAO,EAAE,OAAO,CAAC,KAAK;KACvB,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,cAAc,CAClC,OAAwB,EACxB,OAAuB;IAEvB,MAAM,OAAO,CAAC,WAAW,CAAC,OAAO,CAAC,KAAK,EAAE,OAAO,CAAC,MAAM,CAAC,CAAC;IACzD,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,KAAK,EAAE,OAAO,CAAC,KAAK;QACpB,MAAM,EAAE,OAAO,CAAC,MA
AM;KACvB,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,eAAe,CACnC,OAA6D,EAC7D,QAAwB;IAExB,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,IAAI,EAAE,wEAAwE;KAC/E,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,OAAsB,EACtB,OAAuB;IAEvB,MAAM,MAAM,GAAG,OAAO,CAAC,SAAS,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;IACjD,IAAI,CAAC,MAAM,EAAE,CAAC;QACZ,MAAM,SAAS,GAAG,OAAO,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAChE,MAAM,IAAI,KAAK,CAAC,mBAAmB,OAAO,CAAC,MAAM,gBAAgB,SAAS,KAAK,CAAC,CAAC;IACnF,CAAC;IAED,MAAM,OAAO,CAAC,WAAW,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;IAEzE,IAAI,MAAM,CAAC,iBAAiB,IAAI,MAAM,CAAC,iBAAiB,KAAK,CAAC,EAAE,CAAC;QAC/D,MAAM,OAAO,CAAC,oBAAoB,CAChC,MAAM,CAAC,iBAAiB,EACxB,MAAM,CAAC,QAAQ,CAAC,KAAK,EACrB,MAAM,CAAC,QAAQ,CAAC,MAAM,EACtB,MAAM,CAAC,QAAQ,IAAI,KAAK,CACzB,CAAC;IACJ,CAAC;SAAM,CAAC;QACN,IAAI,CAAC;YACH,MAAM,OAAO,CAAC,0BAA0B,EAAE,CAAC;QAC7C,CAAC;QAAC,MAAM,CAAC;YACP,yCAAyC;QAC3C,CAAC;IACH,CAAC;IAED,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,MAAM,EAAE,OAAO,CAAC,MAAM;QACtB,QAAQ,EAAE,MAAM,CAAC,QAAQ;QACzB,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,iBAAiB,EAAE,MAAM,CAAC,iBAAiB;KAC5C,CAAC,CAAC;AACL,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,UAAU,CAC9B,OAAqC,EACrC,OAAuB;IAEvB,OAAO,CAAC,UAAU,CAAC,EAAE,MAAM,EAAE,MAAM,EAAE,CAAC,CAAC;IACvC,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,MAAM,IAAI,CAAC,MAAM,EAAE,CAAC;IACpB,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;AAC1D,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,aAAa,CACjC,OAAwC,EACxC,OAAuB;IAEvB,OAAO,CAAC,UAAU,CAAC,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC,CAAC;IAC1C,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,MAAM,IAAI,CAAC,SAAS,EAAE,CAAC;IACvB,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;AAC1D,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,OAAuC,EACvC,OAAuB;IAEvB,OAAO,CAAC,UAAU,CAAC,EAAE,MAAM,EAAE,QAAQ,EAAE,CAAC,CAAC;IACzC,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,MAAM,IAAI,CAAC,MAAM,EAAE,CAAC;IACpB,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE
,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;AAC1D,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,SAAS,CAC7B,OAAoC,EACpC,OAAuB;IAEvB,IAAI,OAAO,CAAC,OAAO,EAAE,CAAC;QACpB,MAAM,YAAY,GAAG,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC;QACvD,MAAM,GAAG,GAAG,MAAM,YAAY,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,QAAQ,CAAC,GAAG,EAAE,CAAC,MAAM,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC;QACrF,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;IAC9C,CAAC;SAAM,CAAC;QACN,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;QAC/B,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;IAC1D,CAAC;AACH,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,WAAW,CAC/B,OAAsC,EACtC,OAAuB;IAEvB,IAAI,OAAO,CAAC,OAAO,EAAE,CAAC;QACpB,MAAM,YAAY,GAAG,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC;QACvD,MAAM,KAAK,GAAG,MAAM,YAAY,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,QAAQ,CAAC,GAAG,EAAE,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;QACjF,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,KAAK,EAAE,CAAC,CAAC;IAChD,CAAC;SAAM,CAAC;QACN,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;QAC/B,MAAM,KAAK,GAAG,MAAM,IAAI,CAAC,KAAK,EAAE,CAAC;QACjC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,KAAK,EAAE,CAAC,CAAC;IAChD,CAAC;AACH,CAAC"}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import type { Page } from 'playwright-core';
|
|
2
|
+
import type { BrowserManager } from '../browser/index.js';
|
|
3
|
+
import type { CrawlCommand, CrawlResult, Response } from '../types.js';
|
|
4
|
+
/**
 * Crawls pages starting at `command.url`, following discovered links.
 * In the implementation, `command.depth` defaults to 2, `command.limit` to
 * 50 pages, `command.format` to 'markdown' and `command.timeout` to 15
 * (seconds). Resolves to a response listing the crawled pages and a count of
 * failed page loads.
 */
export declare function handleCrawl(command: CrawlCommand, browser: BrowserManager): Promise<Response<CrawlResult>>;
|
|
5
|
+
/**
 * Collects link URLs from the `a[href]` anchors of `page`, resolving each
 * href to an absolute URL.
 * NOTE(review): the base parameters presumably restrict results to the
 * crawl's site/path — confirm against the implementation.
 */
export declare function discoverLinks(page: Page, baseOrigin: string, baseHostname: string, basePath: string): Promise<string[]>;
|
|
6
|
+
/**
 * Returns a normalized string form of `url`. The crawler uses the result as
 * its key for de-duplicating visited and queued URLs.
 * NOTE(review): the exact normalization rules are defined in the
 * implementation — confirm there before relying on specifics.
 */
export declare function normalizeUrl(url: string): string;
|
|
7
|
+
/**
 * Returns a normalized string form of an already-parsed `URL`.
 * NOTE(review): presumably applies the same rules as `normalizeUrl` —
 * confirm against the implementation.
 */
export declare function normalizeUrlFromUrl(u: URL): string;
|
|
8
|
+
//# sourceMappingURL=crawl.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"crawl.d.ts","sourceRoot":"","sources":["../../src/actions/crawl.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,IAAI,EAAE,MAAM,iBAAiB,CAAC;AAC5C,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AAC1D,OAAO,KAAK,EAAE,YAAY,EAAa,WAAW,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AAuElF,wBAAsB,WAAW,CAC/B,OAAO,EAAE,YAAY,EACrB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,WAAW,CAAC,CAAC,CAmGhC;AAoDD,wBAAsB,aAAa,CACjC,IAAI,EAAE,IAAI,EACV,UAAU,EAAE,MAAM,EAClB,YAAY,EAAE,MAAM,EACpB,QAAQ,EAAE,MAAM,GACf,OAAO,CAAC,MAAM,EAAE,CAAC,CAiDnB;AAsCD,wBAAgB,YAAY,CAAC,GAAG,EAAE,MAAM,GAAG,MAAM,CAOhD;AAED,wBAAgB,mBAAmB,CAAC,CAAC,EAAE,GAAG,GAAG,MAAM,CAelD"}
|
|
@@ -0,0 +1,290 @@
|
|
|
1
|
+
import { successResponse } from '../protocol.js';
|
|
2
|
+
import { extractContentFromPage } from './utils.js';
|
|
3
|
+
// File extensions treated as static assets / non-page resources.
const STATIC_EXTENSIONS = [
  // images
  '.png', '.jpg', '.jpeg', '.gif', '.webp', '.svg', '.ico',
  // stylesheets and scripts
  '.css', '.js',
  // fonts
  '.woff', '.woff2', '.ttf', '.eot',
  // archives
  '.zip', '.tar', '.gz', '.rar',
  // documents
  '.pdf', '.doc', '.docx', '.xls', '.xlsx',
  // audio / video
  '.mp3', '.mp4', '.avi', '.mov',
  // feeds and XML
  '.rss', '.atom', '.xml',
];
|
|
34
|
+
// Social-network domains.
const SOCIAL_DOMAINS = [
  'facebook.com', 'twitter.com', 'x.com', 'instagram.com',
  'linkedin.com', 'youtube.com', 'tiktok.com', 'reddit.com',
  'pinterest.com', 'tumblr.com', 'weibo.com', 'zhihu.com',
];
|
|
48
|
+
// URL patterns the crawler de-prioritizes (a match yields priority 10
// instead of 0, so these pages are crawled last).
const LOW_VALUE_PATTERNS = [
  // patterns that require a trailing slash after the segment
  /\/commit\//i, /\/tree\//i, /\/blob\//i, /\/raw\//i,
  /\/releases\//i, /\/compare\//i,
  // patterns that match the segment prefix anywhere in the URL
  /\/fork/i, /\/stargazers/i, /\/watchers/i, /\/network/i,
  /\/graphs/i, /\/settings/i, /\/community/i, /\/templates/i,
  /\/milestones/i, /\/labels/i, /\/assignments/i,
];
|
|
67
|
+
/**
 * Crawls a site starting at `command.url` and returns the extracted pages.
 *
 * Pages are fetched one at a time on the browser's single page. The queue is
 * ordered by priority (URLs matching LOW_VALUE_PATTERNS go last) and then by
 * depth. Links are followed while the page's depth is below `command.depth`
 * and the page budget (`command.limit`) is not exhausted.
 *
 * Each URL is queued at most once. Previously a URL already waiting in the
 * queue was pushed again by every page linking to it; those duplicates
 * counted toward the page budget and could end the crawl below `limit` with
 * reachable pages left unvisited.
 *
 * @param {object} command - Carries `id`, `url`, and optional `depth`
 *   (default 2), `limit` (default 50), `format` (default 'markdown'),
 *   `timeout` in seconds (default 15) and `selector`.
 * @param {object} browser - Browser manager exposing `getPage`.
 * @returns {Promise<object>} Success response `{ url, pages, total, crawled,
 *   failed }`, or an error response when no page is available.
 */
export async function handleCrawl(command, browser) {
  const page = browser.getPage();
  if (!page) {
    return {
      id: command.id,
      success: false,
      error: 'Browser page not initialized',
    };
  }

  const maxDepth = command.depth ?? 2;
  const maxPages = command.limit ?? 50;
  const format = command.format ?? 'markdown';
  const timeoutMs = (command.timeout ?? 15) * 1000;

  const startUrl = normalizeUrl(command.url);
  const parsedStart = new URL(startUrl);
  const baseOrigin = parsedStart.origin;
  const baseHostname = parsedStart.hostname.replace(/^www\./, '');
  const basePath = parsedStart.pathname.replace(/\/$/, '');

  const visited = new Set(); // URLs already dequeued (or reached via redirect)
  const pages = [];
  const pageUrls = new Set(); // final URLs of collected pages
  let failed = 0;

  const startEntry = { url: startUrl, depth: 0, priority: 0 };
  const queue = [startEntry];
  // URL -> queue entry for everything currently waiting in `queue`.
  const pending = new Map([[startUrl, startEntry]]);

  const urlPriority = (url) => (LOW_VALUE_PATTERNS.some((p) => p.test(url)) ? 10 : 0);

  while (queue.length > 0 && pages.length < maxPages) {
    queue.sort((a, b) => a.priority - b.priority || a.depth - b.depth);

    // Batch size is 1: all fetches share the same page object.
    const batch = [];
    while (queue.length > 0 && batch.length < 1 && pages.length + batch.length < maxPages) {
      const entry = queue.shift();
      pending.delete(entry.url);
      const normalized = normalizeUrl(entry.url);
      if (visited.has(normalized)) {
        continue;
      }
      visited.add(normalized);
      batch.push({ ...entry, url: normalized });
    }

    const results = await Promise.allSettled(
      batch.map((entry) =>
        crawlPage(page, entry.url, baseOrigin, baseHostname, basePath, format, command.selector, timeoutMs),
      ),
    );

    for (let i = 0; i < results.length; i++) {
      const result = results[i];
      const entry = batch[i];

      if (result.status !== 'fulfilled' || !result.value) {
        failed++;
        continue;
      }

      const crawlPageData = result.value;
      const finalUrl = normalizeUrl(crawlPageData.url);
      // After a redirect the final URL differs from the requested one; mark
      // it visited so links pointing at it are not fetched a second time.
      visited.add(finalUrl);
      if (pageUrls.has(finalUrl)) {
        continue;
      }
      pageUrls.add(finalUrl);
      pages.push(crawlPageData);

      if (entry.depth >= maxDepth) {
        continue;
      }

      const childDepth = entry.depth + 1;
      for (const link of crawlPageData.links || []) {
        const normalized = normalizeUrl(link);
        if (visited.has(normalized)) {
          continue;
        }
        const queued = pending.get(normalized);
        if (queued) {
          // Already waiting: keep a single entry at the shallowest depth.
          if (childDepth < queued.depth) {
            queued.depth = childDepth;
          }
          continue;
        }
        if (!isAllowedUrl(normalized, baseOrigin, baseHostname, basePath)) {
          continue;
        }
        if (pages.length + queue.length >= maxPages) {
          break;
        }
        const next = {
          url: normalized,
          depth: childDepth,
          priority: urlPriority(normalized),
        };
        queue.push(next);
        pending.set(normalized, next);
      }
    }
  }

  return successResponse(command.id, {
    url: startUrl,
    pages,
    total: pages.length,
    crawled: pages.length,
    failed,
  });
}
|
|
149
|
+
/**
 * Loads a single URL in `page` and extracts its title, content and outgoing links.
 *
 * Navigation waits for `domcontentloaded` (bounded by `timeoutMs`), then makes a
 * best-effort 5s wait for network idle and, when `selector` is given, a
 * best-effort 5s wait for the first match to be attached.
 *
 * If anything throws with a message containing "Timeout" or "timeout", the
 * function still tries to salvage whatever the page currently shows; any other
 * failure yields `null`.
 *
 * @param page Page-like object providing goto/waitForLoadState/locator/title/url.
 * @param {string} url Address to load.
 * @param {string} baseOrigin Forwarded to `discoverLinks`.
 * @param {string} baseHostname Forwarded to `discoverLinks`.
 * @param {string} basePath Forwarded to `discoverLinks`.
 * @param format Forwarded to `extractContentFromPage`.
 * @param {string} [selector] Optional selector to wait for and extract from.
 * @param {number} [timeoutMs=15000] Navigation timeout in milliseconds.
 * @returns {Promise<{url: string, title: string, content: *, links: string[]} | null>}
 */
async function crawlPage(page, url, baseOrigin, baseHostname, basePath, format, selector, timeoutMs = 15000) {
    try {
        await page.goto(url, { timeout: timeoutMs, waitUntil: 'domcontentloaded' });
        // Network idle is a nice-to-have; a page that never goes idle is still crawled.
        await page.waitForLoadState('networkidle', { timeout: 5000 }).catch(() => { });
        if (selector) {
            try {
                const firstMatch = page.locator(selector).first();
                await firstMatch.waitFor({ state: 'attached', timeout: 5000 });
            }
            catch {
                // Selector may not exist on all pages
            }
        }
        const pending = [
            page.title(),
            extractContentFromPage(page, format, selector),
            discoverLinks(page, baseOrigin, baseHostname, basePath),
        ];
        const [title, content, links] = await Promise.all(pending);
        return { url: page.url(), title, content, links };
    }
    catch (err) {
        const message = err instanceof Error ? err.message : String(err);
        const timedOut = ['Timeout', 'timeout'].some((needle) => message.includes(needle));
        if (!timedOut) {
            return null;
        }
        // A timeout often leaves a partially rendered page behind: keep what is there.
        try {
            const [title, content] = await Promise.all([
                page.title().catch(() => url),
                extractContentFromPage(page, format, selector).catch(() => ''),
            ]);
            const links = await discoverLinks(page, baseOrigin, baseHostname, basePath).catch(() => []);
            return { url: page.url(), title, content, links };
        }
        catch {
            return null;
        }
    }
}
|
|
186
|
+
/**
 * Collects the crawlable links found on the page currently loaded in `page`.
 *
 * Every `a[href]` is resolved to an absolute URL inside the page, then filtered
 * with `isAllowedUrl` and canonicalised with `normalizeUrl` (both defined in
 * this file), so the rules applied here cannot drift from the ones the crawl
 * queue uses.
 *
 * @param page Page-like object exposing `evaluate(fn, arg)`.
 * @param {string} baseOrigin Origin of the crawl start URL.
 * @param {string} baseHostname Hostname of the crawl start URL.
 * @param {string} basePath Path prefix the crawl is restricted to.
 * @returns {Promise<string[]>} De-duplicated, normalized link URLs.
 */
export async function discoverLinks(page, baseOrigin, baseHostname, basePath) {
    const hrefs = await page.evaluate((fallbackBase) => {
        // Relative hrefs must be resolved against the document's own base URL
        // (current location or <base href>), not the site origin: "next.html"
        // on /docs/guide/intro.html is /docs/guide/next.html, not /next.html.
        const base = document.baseURI || fallbackBase;
        const resolved = [];
        document.querySelectorAll('a[href]').forEach((anchor) => {
            const href = anchor.getAttribute('href');
            if (!href)
                return;
            try {
                resolved.push(new URL(href, base).href);
            }
            catch {
                // invalid URL
            }
        });
        return resolved;
    }, baseOrigin);
    const filtered = new Set();
    for (const href of hrefs) {
        if (!isAllowedUrl(href, baseOrigin, baseHostname, basePath))
            continue;
        filtered.add(normalizeUrl(href));
    }
    return Array.from(filtered);
}
|
|
236
|
+
/**
 * Decides whether `url` may be queued for crawling.
 *
 * A URL is accepted when it is http(s), does not end in one of
 * STATIC_EXTENSIONS, is not on one of SOCIAL_DOMAINS, belongs to the base
 * site (same hostname ignoring a leading "www.", a subdomain of it, or the
 * same origin) and, when `basePath` is set to something other than "/",
 * lies at or below that path. Anything that fails to parse is rejected.
 *
 * @param {string} url Absolute URL to check.
 * @param {string} baseOrigin Origin of the crawl start URL.
 * @param {string} baseHostname Hostname of the crawl start URL.
 * @param {string} basePath Path prefix the crawl is restricted to.
 * @returns {boolean}
 */
function isAllowedUrl(url, baseOrigin, baseHostname, basePath) {
    try {
        const target = new URL(url);
        const isWeb = target.protocol === 'http:' || target.protocol === 'https:';
        if (!isWeb) {
            return false;
        }
        const lowerPath = target.pathname.toLowerCase();
        for (const ext of STATIC_EXTENSIONS) {
            if (lowerPath.endsWith(ext)) {
                return false;
            }
        }
        const host = target.hostname.replace(/^www\./, '');
        const isSocial = SOCIAL_DOMAINS.some((d) => host === d || host.endsWith('.' + d));
        if (isSocial) {
            return false;
        }
        const sameSite = host === baseHostname ||
            host.endsWith('.' + baseHostname) ||
            target.origin === baseOrigin;
        if (!sameSite) {
            return false;
        }
        if (!basePath || basePath === '/') {
            return true;
        }
        const prefix = basePath.endsWith('/') ? basePath : basePath + '/';
        return target.pathname === basePath || target.pathname.startsWith(prefix);
    }
    catch {
        return false;
    }
}
|
|
265
|
+
/**
 * Canonicalises a URL string via `normalizeUrlFromUrl`.
 *
 * @param {string} url URL to normalize.
 * @returns {string} The normalized URL, or `url` unchanged when it cannot be
 *   parsed (or normalization throws).
 */
export function normalizeUrl(url) {
    let result = url;
    try {
        result = normalizeUrlFromUrl(new URL(url));
    }
    catch {
        // Unparseable input is handed back untouched.
    }
    return result;
}
|
|
274
|
+
/**
 * Builds the canonical string form of an already-parsed URL.
 *
 * The result is `origin + pathname` with a single trailing slash removed
 * (the root path "/" is kept). The query string is dropped. A fragment is
 * kept only when it starts with "#/" (hash-based routing), and then only its
 * path part up to the first "?" or "#"; an empty or "/" hash route is dropped.
 *
 * @param {URL} u Parsed URL.
 * @returns {string} Normalized URL string.
 */
export function normalizeUrlFromUrl(u) {
    const hasTrailingSlash = u.pathname.length > 1 && u.pathname.endsWith('/');
    const path = hasTrailingSlash ? u.pathname.slice(0, -1) : u.pathname;
    const base = `${u.origin}${path}`;
    const fragment = u.hash;
    if (!fragment || !fragment.startsWith('#/')) {
        return base;
    }
    const [route] = fragment.slice(2).split(/[?#]/);
    return route && route !== '/' ? `${base}#/${route}` : base;
}
|
|
290
|
+
//# sourceMappingURL=crawl.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"crawl.js","sourceRoot":"","sources":["../../src/actions/crawl.ts"],"names":[],"mappings":"AAGA,OAAO,EAAE,eAAe,EAAE,MAAM,gBAAgB,CAAC;AACjD,OAAO,EAAkB,sBAAsB,EAAqB,MAAM,YAAY,CAAC;AAEvF,MAAM,iBAAiB,GAAG;IACxB,MAAM;IACN,MAAM;IACN,OAAO;IACP,MAAM;IACN,OAAO;IACP,MAAM;IACN,MAAM;IACN,MAAM;IACN,KAAK;IACL,OAAO;IACP,QAAQ;IACR,MAAM;IACN,MAAM;IACN,MAAM;IACN,MAAM;IACN,KAAK;IACL,MAAM;IACN,MAAM;IACN,MAAM;IACN,OAAO;IACP,MAAM;IACN,OAAO;IACP,MAAM;IACN,MAAM;IACN,MAAM;IACN,MAAM;IACN,MAAM;IACN,OAAO;IACP,MAAM;CACP,CAAC;AAEF,MAAM,cAAc,GAAG;IACrB,cAAc;IACd,aAAa;IACb,OAAO;IACP,eAAe;IACf,cAAc;IACd,aAAa;IACb,YAAY;IACZ,YAAY;IACZ,eAAe;IACf,YAAY;IACZ,WAAW;IACX,WAAW;CACZ,CAAC;AAEF,MAAM,kBAAkB,GAAG;IACzB,aAAa;IACb,WAAW;IACX,WAAW;IACX,UAAU;IACV,eAAe;IACf,cAAc;IACd,SAAS;IACT,eAAe;IACf,aAAa;IACb,YAAY;IACZ,WAAW;IACX,aAAa;IACb,cAAc;IACd,cAAc;IACd,eAAe;IACf,WAAW;IACX,gBAAgB;CACjB,CAAC;AAEF,MAAM,CAAC,KAAK,UAAU,WAAW,CAC/B,OAAqB,EACrB,OAAuB;IAEvB,MAAM,IAAI,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAC/B,IAAI,CAAC,IAAI,EAAE,CAAC;QACV,OAAO;YACL,EAAE,EAAE,OAAO,CAAC,EAAE;YACd,OAAO,EAAE,KAAK;YACd,KAAK,EAAE,8BAA8B;SACtC,CAAC;IACJ,CAAC;IAED,MAAM,QAAQ,GAAG,OAAO,CAAC,KAAK,IAAI,CAAC,CAAC;IACpC,MAAM,QAAQ,GAAG,OAAO,CAAC,KAAK,IAAI,EAAE,CAAC;IACrC,MAAM,MAAM,GAAG,OAAO,CAAC,MAAM,IAAI,UAAU,CAAC;IAC5C,MAAM,SAAS,GAAG,CAAC,OAAO,CAAC,OAAO,IAAI,EAAE,CAAC,GAAG,IAAI,CAAC;IAEjD,MAAM,QAAQ,GAAG,YAAY,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;IAC3C,MAAM,WAAW,GAAG,IAAI,GAAG,CAAC,QAAQ,CAAC,CAAC;IACtC,MAAM,UAAU,GAAG,WAAW,CAAC,MAAM,CAAC;IACtC,MAAM,YAAY,GAAG,WAAW,CAAC,QAAQ,CAAC,OAAO,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;IAChE,MAAM,QAAQ,GAAG,WAAW,CAAC,QAAQ,CAAC,OAAO,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC;IACzD,MAAM,OAAO,GAAG,IAAI,GAAG,EAAU,CAAC;IAClC,MAAM,KAAK,GAAgB,EAAE,CAAC;IAC9B,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAU,CAAC;IACnC,IAAI,MAAM,GAAG,CAAC,CAAC;IAGf,MAAM,KAAK,GAAiB,CAAC,EAAE,GAAG,EAAE,QAAQ,EAAE,KAAK,EAAE,CAAC,EAAE,QAAQ,EAAE,CAAC,EAAE,CAAC,CAAC;IAEvE,SAAS,WAAW,CAAC,GAAW;QAC9B,KAAK,MAAM,CAAC,IAAI,kBAAkB,EAAE,CAAC;YACnC,IAAI,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC;gBAAE,OA
AO,EAAE,CAAC;QAC7B,CAAC;QACD,OAAO,CAAC,CAAC;IACX,CAAC;IAED,OAAO,KAAK,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,MAAM,GAAG,QAAQ,EAAE,CAAC;QACnD,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,QAAQ,GAAG,CAAC,CAAC,QAAQ,IAAI,CAAC,CAAC,KAAK,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC;QAEnE,MAAM,KAAK,GAAiB,EAAE,CAAC;QAC/B,OAAO,KAAK,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,MAAM,GAAG,KAAK,CAAC,MAAM,GAAG,QAAQ,EAAE,CAAC;YACtF,MAAM,KAAK,GAAG,KAAK,CAAC,KAAK,EAAG,CAAC;YAC7B,MAAM,UAAU,GAAG,YAAY,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;YAC3C,IAAI,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC;gBAAE,SAAS;YACtC,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC,CAAC;YACxB,KAAK,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,GAAG,EAAE,UAAU,EAAE,CAAC,CAAC;QAC5C,CAAC;QAED,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,UAAU,CACtC,KAAK,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE,CAClB,SAAS,CACP,IAAI,EACJ,KAAK,CAAC,GAAG,EACT,UAAU,EACV,YAAY,EACZ,QAAQ,EACR,MAAM,EACN,OAAO,CAAC,QAAQ,EAChB,SAAS,CACV,CACF,CACF,CAAC;QAEF,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACxC,MAAM,MAAM,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC;YAC1B,MAAM,KAAK,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YAEvB,IAAI,MAAM,CAAC,MAAM,KAAK,WAAW,IAAI,MAAM,CAAC,KAAK,EAAE,CAAC;gBAClD,MAAM,aAAa,GAAG,MAAM,CAAC,KAAK,CAAC;gBACnC,MAAM,QAAQ,GAAG,YAAY,CAAC,aAAa,CAAC,GAAG,CAAC,CAAC;gBACjD,IAAI,QAAQ,CAAC,GAAG,CAAC,QAAQ,CAAC;oBAAE,SAAS;gBACrC,QAAQ,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;gBACvB,KAAK,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;gBAE1B,IAAI,KAAK,CAAC,KAAK,GAAG,QAAQ,EAAE,CAAC;oBAC3B,KAAK,MAAM,IAAI,IAAI,aAAa,CAAC,KAAK,IAAI,EAAE,EAAE,CAAC;wBAC7C,MAAM,UAAU,GAAG,YAAY,CAAC,IAAI,CAAC,CAAC;wBACtC,IAAI,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC;4BAAE,SAAS;wBACtC,IAAI,CAAC,YAAY,CAAC,UAAU,EAAE,UAAU,EAAE,YAAY,EAAE,QAAQ,CAAC;4BAAE,SAAS;wBAC5E,IAAI,KAAK,CAAC,MAAM,GAAG,KAAK,CAAC,MAAM,IAAI,QAAQ;4BAAE,MAAM;wBACnD,KAAK,CAAC,IAAI,CAAC;4BACT,GAAG,EAAE,UAAU;4BACf,KAAK,EAAE,KAAK,CAAC,KAAK,GAAG,CAAC;4BACtB,QAAQ,EAAE,WAAW,CAAC,UAAU,CAAC;yBAClC,CAAC,CAAC;oBACL,CAAC;gBACH,CAAC;YACH,CAAC;iBAAM,CAAC;gBACN,MAAM,EAAE,CAAC;YACX,CAAC;QACH,CAAC;IACH,C
AAC;IAED,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE;QACjC,GAAG,EAAE,QAAQ;QACb,KAAK;QACL,KAAK,EAAE,KAAK,CAAC,MAAM;QACnB,OAAO,EAAE,KAAK,CAAC,MAAM;QACrB,MAAM;KACP,CAAC,CAAC;AACL,CAAC;AAED,KAAK,UAAU,SAAS,CACtB,IAAU,EACV,GAAW,EACX,UAAkB,EAClB,YAAoB,EACpB,QAAgB,EAChB,MAAoC,EACpC,QAAiB,EACjB,YAAoB,KAAK;IAEzB,IAAI,CAAC;QACH,MAAM,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,SAAS,EAAE,SAAS,EAAE,kBAAkB,EAAE,CAAC,CAAC;QAE5E,MAAM,IAAI,CAAC,gBAAgB,CAAC,aAAa,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC,KAAK,CAAC,GAAG,EAAE,GAAE,CAAC,CAAC,CAAC;QAE9E,IAAI,QAAQ,EAAE,CAAC;YACb,IAAI,CAAC;gBACH,MAAM,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,KAAK,EAAE,CAAC,OAAO,CAAC,EAAE,KAAK,EAAE,UAAU,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;YACrF,CAAC;YAAC,MAAM,CAAC;gBACP,sCAAsC;YACxC,CAAC;QACH,CAAC;QAED,MAAM,CAAC,KAAK,EAAE,OAAO,EAAE,KAAK,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;YAChD,IAAI,CAAC,KAAK,EAAE;YACZ,sBAAsB,CAAC,IAAI,EAAE,MAAM,EAAE,QAAQ,CAAC;YAC9C,aAAa,CAAC,IAAI,EAAE,UAAU,EAAE,YAAY,EAAE,QAAQ,CAAC;SACxD,CAAC,CAAC;QAEH,OAAO,EAAE,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,KAAK,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC;IACpD,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,MAAM,GAAG,GAAG,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;QAC7D,IAAI,GAAG,CAAC,QAAQ,CAAC,SAAS,CAAC,IAAI,GAAG,CAAC,QAAQ,CAAC,SAAS,CAAC,EAAE,CAAC;YACvD,IAAI,CAAC;gBACH,MAAM,CAAC,KAAK,EAAE,OAAO,CAAC,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC;oBACzC,IAAI,CAAC,KAAK,EAAE,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,GAAG,CAAC;oBAC7B,sBAAsB,CAAC,IAAI,EAAE,MAAM,EAAE,QAAQ,CAAC,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,EAAE,CAAC;iBAC/D,CAAC,CAAC;gBACH,MAAM,KAAK,GAAG,MAAM,aAAa,CAAC,IAAI,EAAE,UAAU,EAAE,YAAY,EAAE,QAAQ,CAAC,CAAC,KAAK,CAC/E,GAAG,EAAE,CAAC,EAAc,CACrB,CAAC;gBACF,OAAO,EAAE,GAAG,EAAE,IAAI,CAAC,GAAG,EAAE,EAAE,KAAK,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC;YACpD,CAAC;YAAC,MAAM,CAAC;gBACP,OAAO,IAAI,CAAC;YACd,CAAC;QACH,CAAC;QACD,OAAO,IAAI,CAAC;IACd,CAAC;AACH,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,aAAa,CACjC,IAAU,EACV,UAAkB,EAClB,YAAoB,EACpB,QAAgB;IAEhB,MAAM,KAAK,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,CAAC,MAAc,EAAE,EAAE;QACnD,MA
AM,OAAO,GAAG,QAAQ,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;QACrD,MAAM,OAAO,GAAa,EAAE,CAAC;QAC7B,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,EAAE;YACpB,MAAM,IAAI,GAAG,CAAC,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC;YACpC,IAAI,CAAC,IAAI;gBAAE,OAAO;YAClB,IAAI,CAAC;gBACH,MAAM,OAAO,GAAG,IAAI,GAAG,CAAC,IAAI,EAAE,MAAM,CAAC,CAAC,IAAI,CAAC;gBAC3C,OAAO,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;YACxB,CAAC;YAAC,MAAM,CAAC;gBACP,cAAc;YAChB,CAAC;QACH,CAAC,CAAC,CAAC;QACH,OAAO,OAAO,CAAC;IACjB,CAAC,EAAE,UAAU,CAAC,CAAC;IAEf,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAU,CAAC;IAEnC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,CAAC;YACH,MAAM,GAAG,GAAG,IAAI,GAAG,CAAC,IAAI,CAAC,CAAC;YAE1B,IAAI,GAAG,CAAC,QAAQ,KAAK,OAAO,IAAI,GAAG,CAAC,QAAQ,KAAK,QAAQ;gBAAE,SAAS;YAEpE,MAAM,QAAQ,GAAG,GAAG,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;YAC5C,IAAI,iBAAiB,CAAC,IAAI,CAAC,CAAC,GAAG,EAAE,EAAE,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;gBAAE,SAAS;YAEtE,MAAM,QAAQ,GAAG,GAAG,CAAC,QAAQ,CAAC,OAAO,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;YACpD,IAAI,cAAc,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,QAAQ,KAAK,CAAC,IAAI,QAAQ,CAAC,QAAQ,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC;gBAAE,SAAS;YAEvF,IAAI,QAAQ,KAAK,YAAY,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,GAAG,YAAY,CAAC,EAAE,CAAC;gBACxE,IAAI,GAAG,CAAC,MAAM,KAAK,UAAU;oBAAE,SAAS;YAC1C,CAAC;YAED,IAAI,QAAQ,IAAI,QAAQ,KAAK,GAAG,EAAE,CAAC;gBACjC,MAAM,cAAc,GAAG,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,QAAQ,GAAG,GAAG,CAAC;gBAC1E,MAAM,OAAO,GAAG,GAAG,CAAC,QAAQ,CAAC;gBAC7B,IAAI,OAAO,KAAK,QAAQ,IAAI,CAAC,OAAO,CAAC,UAAU,CAAC,cAAc,CAAC;oBAAE,SAAS;YAC5E,CAAC;YAED,MAAM,UAAU,GAAG,mBAAmB,CAAC,GAAG,CAAC,CAAC;YAC5C,IAAI,UAAU;gBAAE,QAAQ,CAAC,GAAG,CAAC,UAAU,CAAC,CAAC;QAC3C,CAAC;QAAC,MAAM,CAAC;YACP,SAAS;QACX,CAAC;IACH,CAAC;IAED,OAAO,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;AAC9B,CAAC;AAED,SAAS,YAAY,CACnB,GAAW,EACX,UAAkB,EAClB,YAAoB,EACpB,QAAgB;IAEhB,IAAI,CAAC;QACH,MAAM,CAAC,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC;QACvB,IAAI,CAAC,CAAC,QAAQ,KAAK,OAAO,IAAI,CAAC,CAAC,QAAQ,KAAK,QAAQ;YAAE,OAAO,KAAK,CAAC;QACpE,MAAM,QAAQ,GAAG,CAAC,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;QAC1C,IAAI,iBAAiB,CAAC,IAAI,CAAC
,CAAC,GAAG,EAAE,EAAE,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;YAAE,OAAO,KAAK,CAAC;QAC1E,MAAM,QAAQ,GAAG,CAAC,CAAC,QAAQ,CAAC,OAAO,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;QAClD,IAAI,cAAc,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,QAAQ,KAAK,CAAC,IAAI,QAAQ,CAAC,QAAQ,CAAC,GAAG,GAAG,CAAC,CAAC,CAAC;YAAE,OAAO,KAAK,CAAC;QAE3F,IACE,QAAQ,KAAK,YAAY;YACzB,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,GAAG,YAAY,CAAC;YACtC,CAAC,CAAC,MAAM,KAAK,UAAU,EACvB,CAAC;YACD,OAAO,KAAK,CAAC;QACf,CAAC;QAED,IAAI,QAAQ,IAAI,QAAQ,KAAK,GAAG,EAAE,CAAC;YACjC,MAAM,cAAc,GAAG,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,QAAQ,GAAG,GAAG,CAAC;YAC1E,MAAM,OAAO,GAAG,CAAC,CAAC,QAAQ,CAAC;YAC3B,IAAI,OAAO,KAAK,QAAQ,IAAI,CAAC,OAAO,CAAC,UAAU,CAAC,cAAc,CAAC,EAAE,CAAC;gBAChE,OAAO,KAAK,CAAC;YACf,CAAC;QACH,CAAC;QAED,OAAO,IAAI,CAAC;IACd,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,KAAK,CAAC;IACf,CAAC;AACH,CAAC;AAED,MAAM,UAAU,YAAY,CAAC,GAAW;IACtC,IAAI,CAAC;QACH,MAAM,CAAC,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC;QACvB,OAAO,mBAAmB,CAAC,CAAC,CAAC,CAAC;IAChC,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,GAAG,CAAC;IACb,CAAC;AACH,CAAC;AAED,MAAM,UAAU,mBAAmB,CAAC,CAAM;IACxC,IAAI,QAAQ,GAAG,CAAC,CAAC,QAAQ,CAAC;IAC1B,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,IAAI,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,EAAE,CAAC;QAClD,QAAQ,GAAG,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC;IACnC,CAAC;IACD,MAAM,IAAI,GAAG,CAAC,CAAC,IAAI,CAAC;IACpB,IAAI,IAAI,IAAI,IAAI,CAAC,UAAU,CAAC,IAAI,CAAC,EAAE,CAAC;QAClC,MAAM,QAAQ,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;QAC/B,MAAM,aAAa,GAAG,QAAQ,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC;QAChD,IAAI,CAAC,aAAa,IAAI,aAAa,KAAK,GAAG,EAAE,CAAC;YAC5C,OAAO,GAAG,CAAC,CAAC,MAAM,GAAG,QAAQ,EAAE,CAAC;QAClC,CAAC;QACD,OAAO,GAAG,CAAC,CAAC,MAAM,GAAG,QAAQ,KAAK,aAAa,EAAE,CAAC;IACpD,CAAC;IACD,OAAO,GAAG,CAAC,CAAC,MAAM,GAAG,QAAQ,EAAE,CAAC;AAClC,CAAC"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import type { BrowserManager } from '../browser/index.js';
|
|
2
|
+
import type { Response, GetAttributeCommand, GetTextCommand, IsVisibleCommand, IsEnabledCommand, IsCheckedCommand, CountCommand, BoundingBoxCommand, StylesCommand, StylesData } from '../types.js';
|
|
3
|
+
/**
 * Handler for a GetAttributeCommand.
 * In the compiled elements.js it reads `command.attribute` from the located
 * element and responds with `{ attribute, value }`.
 */
export declare function handleGetAttribute(command: GetAttributeCommand, browser: BrowserManager): Promise<Response>;
|
|
4
|
+
/**
 * Handler for a GetTextCommand.
 * In the compiled elements.js it responds with `{ text }` taken from the
 * located element's `textContent()`.
 */
export declare function handleGetText(command: GetTextCommand, browser: BrowserManager): Promise<Response>;
|
|
5
|
+
/**
 * Handler for an IsVisibleCommand.
 * In the compiled elements.js it responds with `{ visible }` from the
 * located element's `isVisible()`.
 */
export declare function handleIsVisible(command: IsVisibleCommand, browser: BrowserManager): Promise<Response>;
|
|
6
|
+
/**
 * Handler for an IsEnabledCommand.
 * In the compiled elements.js it responds with `{ enabled }` from the
 * located element's `isEnabled()`.
 */
export declare function handleIsEnabled(command: IsEnabledCommand, browser: BrowserManager): Promise<Response>;
|
|
7
|
+
/**
 * Handler for an IsCheckedCommand.
 * In the compiled elements.js it responds with `{ checked }` from the
 * located element's `isChecked()`.
 */
export declare function handleIsChecked(command: IsCheckedCommand, browser: BrowserManager): Promise<Response>;
|
|
8
|
+
/**
 * Handler for a CountCommand.
 * In the compiled elements.js it responds with `{ count }` from the
 * locator's `count()`.
 */
export declare function handleCount(command: CountCommand, browser: BrowserManager): Promise<Response>;
|
|
9
|
+
/**
 * Handler for a BoundingBoxCommand.
 * In the compiled elements.js it responds with `{ box }` from the located
 * element's `boundingBox()`.
 */
export declare function handleBoundingBox(command: BoundingBoxCommand, browser: BrowserManager): Promise<Response>;
|
|
10
|
+
/**
 * Handler for a StylesCommand; resolves to a Response carrying StylesData.
 * In the compiled elements.js the payload is `{ elements }`, one entry per
 * matched element with its tag, trimmed text, rounded bounding box and a
 * selection of computed styles.
 */
export declare function handleStyles(command: StylesCommand, browser: BrowserManager): Promise<Response<StylesData>>;
|
|
11
|
+
//# sourceMappingURL=elements.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"elements.d.ts","sourceRoot":"","sources":["../../src/actions/elements.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AAC1D,OAAO,KAAK,EACV,QAAQ,EACR,mBAAmB,EACnB,cAAc,EACd,gBAAgB,EAChB,gBAAgB,EAChB,gBAAgB,EAChB,YAAY,EACZ,kBAAkB,EAClB,aAAa,EACb,UAAU,EACX,MAAM,aAAa,CAAC;AAGrB,wBAAsB,kBAAkB,CACtC,OAAO,EAAE,mBAAmB,EAC5B,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,aAAa,CACjC,OAAO,EAAE,cAAc,EACvB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,eAAe,CACnC,OAAO,EAAE,gBAAgB,EACzB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,eAAe,CACnC,OAAO,EAAE,gBAAgB,EACzB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,eAAe,CACnC,OAAO,EAAE,gBAAgB,EACzB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,WAAW,CAC/B,OAAO,EAAE,YAAY,EACrB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,iBAAiB,CACrC,OAAO,EAAE,kBAAkB,EAC3B,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAInB;AAED,wBAAsB,YAAY,CAChC,OAAO,EAAE,aAAa,EACtB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAC,CAAC,CA4C/B"}
|
|
@@ -0,0 +1,78 @@
|
|
|
1
|
+
import { successResponse } from '../protocol.js';
|
|
2
|
+
/**
 * Reads one attribute from the element addressed by the command.
 *
 * @param command Carries `id`, `selector`, optional `inFrame` and `attribute`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ attribute, value }`.
 */
export async function handleGetAttribute(command, browser) {
    const { selector, inFrame, attribute } = command;
    const value = await browser.getLocator(selector, inFrame).getAttribute(attribute);
    return successResponse(command.id, { attribute, value });
}
|
|
7
|
+
/**
 * Returns the `textContent()` of the element addressed by the command.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ text }`.
 */
export async function handleGetText(command, browser) {
    const { selector, inFrame } = command;
    const text = await browser.getLocator(selector, inFrame).textContent();
    return successResponse(command.id, { text });
}
|
|
12
|
+
/**
 * Reports whether the element addressed by the command is visible.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ visible }`.
 */
export async function handleIsVisible(command, browser) {
    const { selector, inFrame } = command;
    // NOTE(review): Playwright documents the `timeout` option of isVisible() as
    // ignored; confirm whether it can be dropped.
    const visible = await browser.getLocator(selector, inFrame).isVisible({ timeout: 5000 });
    return successResponse(command.id, { visible });
}
|
|
17
|
+
/**
 * Reports whether the element addressed by the command is enabled,
 * waiting up to 5 seconds for it.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ enabled }`.
 */
export async function handleIsEnabled(command, browser) {
    const { selector, inFrame } = command;
    const enabled = await browser.getLocator(selector, inFrame).isEnabled({ timeout: 5000 });
    return successResponse(command.id, { enabled });
}
|
|
22
|
+
/**
 * Reports whether the checkbox/radio addressed by the command is checked,
 * waiting up to 5 seconds for it.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ checked }`.
 */
export async function handleIsChecked(command, browser) {
    const { selector, inFrame } = command;
    const checked = await browser.getLocator(selector, inFrame).isChecked({ timeout: 5000 });
    return successResponse(command.id, { checked });
}
|
|
27
|
+
/**
 * Counts the elements matched by the command's selector.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ count }`.
 */
export async function handleCount(command, browser) {
    const { selector, inFrame } = command;
    const count = await browser.getLocator(selector, inFrame).count();
    return successResponse(command.id, { count });
}
|
|
32
|
+
/**
 * Returns the bounding box of the element addressed by the command.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getLocator(selector, inFrame)`.
 * @returns Success response with `{ box }` (whatever `boundingBox()` resolved to).
 */
export async function handleBoundingBox(command, browser) {
    const { selector, inFrame } = command;
    const box = await browser.getLocator(selector, inFrame).boundingBox();
    return successResponse(command.id, { box });
}
|
|
37
|
+
/**
 * Summarises tag, text, geometry and key computed styles of the targeted element(s).
 *
 * When `command.selector` is a ref (`browser.isRef`), exactly one element is
 * inspected through `browser.getLocator(...).evaluate`; otherwise every match
 * of the selector inside the frame is inspected through `evaluateAll`.
 *
 * The extractor is handed over as a real function instead of being rebuilt in
 * the page with `new Function(...)`: runtime code generation inside the page
 * is rejected by pages whose Content-Security-Policy omits 'unsafe-eval'.
 *
 * @param command Carries `id`, `selector` and optional `inFrame`.
 * @param browser Provides `getFrame`, `isRef` and `getLocator`.
 * @returns Success response with `{ elements }`, one summary per element.
 */
export async function handleStyles(command, browser) {
    const frame = browser.getFrame(command.inFrame);
    // Runs in the page, so it must not close over anything from this module.
    // It accepts a single element (evaluate) or an array of elements
    // (evaluateAll) and mirrors that shape in its result.
    const describeStyles = (target) => {
        const many = Array.isArray(target);
        const summaries = (many ? target : [target]).map((el) => {
            const s = getComputedStyle(el);
            const r = el.getBoundingClientRect();
            return {
                tag: el.tagName.toLowerCase(),
                text: el.innerText?.trim().slice(0, 80) || null,
                box: {
                    x: Math.round(r.x),
                    y: Math.round(r.y),
                    width: Math.round(r.width),
                    height: Math.round(r.height),
                },
                styles: {
                    fontSize: s.fontSize,
                    fontWeight: s.fontWeight,
                    // Only the first family of the font stack, without quotes.
                    fontFamily: s.fontFamily.split(',')[0].trim().replace(/"/g, ''),
                    color: s.color,
                    backgroundColor: s.backgroundColor,
                    borderRadius: s.borderRadius,
                    border: s.border !== 'none' && s.borderWidth !== '0px' ? s.border : null,
                    boxShadow: s.boxShadow !== 'none' ? s.boxShadow : null,
                    padding: s.padding,
                },
            };
        });
        return many ? summaries : summaries[0];
    };
    if (browser.isRef(command.selector)) {
        const element = await browser.getLocator(command.selector).evaluate(describeStyles);
        return successResponse(command.id, { elements: [element] });
    }
    const elements = await frame.locator(command.selector).evaluateAll(describeStyles);
    return successResponse(command.id, { elements });
}
|
|
78
|
+
//# sourceMappingURL=elements.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"elements.js","sourceRoot":"","sources":["../../src/actions/elements.ts"],"names":[],"mappings":"AAaA,OAAO,EAAE,eAAe,EAAE,MAAM,gBAAgB,CAAC;AAEjD,MAAM,CAAC,KAAK,UAAU,kBAAkB,CACtC,OAA4B,EAC5B,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,KAAK,GAAG,MAAM,OAAO,CAAC,YAAY,CAAC,OAAO,CAAC,SAAS,CAAC,CAAC;IAC5D,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,SAAS,EAAE,OAAO,CAAC,SAAS,EAAE,KAAK,EAAE,CAAC,CAAC;AAC9E,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,aAAa,CACjC,OAAuB,EACvB,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,IAAI,GAAG,MAAM,OAAO,CAAC,WAAW,EAAE,CAAC;IACzC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,IAAI,EAAE,CAAC,CAAC;AAC/C,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,eAAe,CACnC,OAAyB,EACzB,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,SAAS,CAAC,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;IAC3D,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,CAAC,CAAC;AAClD,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,eAAe,CACnC,OAAyB,EACzB,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,SAAS,CAAC,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;IAC3D,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,CAAC,CAAC;AAClD,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,eAAe,CACnC,OAAyB,EACzB,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,SAAS,CAAC,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC;IAC3D,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,OAAO,EAAE,CAAC,CAAC;AAClD,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,WAAW,CAC/B,OAAqB,EACrB,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,KAAK,GAAG,MAAM,OAAO,CAAC,KAAK,EAAE,CAAC;IACpC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,KAAK,EAAE,CAAC,CAAC;AAChD,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,iBAAiB,CACrC,OAA2B,EAC3B,OAAuB;IAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,UAA
U,CAAC,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,OAAO,CAAC,CAAC;IACtE,MAAM,GAAG,GAAG,MAAM,OAAO,CAAC,WAAW,EAAE,CAAC;IACxC,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;AAC9C,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,OAAsB,EACtB,OAAuB;IAEvB,MAAM,KAAK,GAAG,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC;IAEhD,MAAM,mBAAmB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;KAwBzB,CAAC;IAEJ,IAAI,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,QAAQ,CAAC,EAAE,CAAC;QACpC,MAAM,OAAO,GAAG,OAAO,CAAC,UAAU,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC;QACrD,MAAM,OAAO,GAAG,CAAC,MAAM,OAAO,CAAC,QAAQ,CAAC,CAAC,EAAE,EAAE,MAAM,EAAE,EAAE;YACrD,MAAM,EAAE,GAAG,IAAI,QAAQ,CAAC,SAAS,GAAG,MAAM,CAAC,EAAE,CAAC;YAC9C,OAAO,EAAE,CAAC,EAAE,CAAC,CAAC;QAChB,CAAC,EAAE,mBAAmB,CAAC,CAA8B,CAAC;QACtD,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,QAAQ,EAAE,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;IAC9D,CAAC;IAED,MAAM,QAAQ,GAAG,CAAC,MAAM,KAAK,CAAC,OAAO,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,WAAW,CAAC,CAAC,GAAG,EAAE,MAAM,EAAE,EAAE;QAClF,MAAM,EAAE,GAAG,IAAI,QAAQ,CAAC,SAAS,GAAG,MAAM,CAAC,EAAE,CAAC;QAC9C,OAAO,GAAG,CAAC,GAAG,CAAC,CAAC,EAAE,EAAE,EAAE,CAAC,EAAE,CAAC,EAAE,CAAC,CAAC,CAAC;IACjC,CAAC,EAAE,mBAAmB,CAAC,CAA2B,CAAC;IAEnD,OAAO,eAAe,CAAC,OAAO,CAAC,EAAE,EAAE,EAAE,QAAQ,EAAE,CAAC,CAAC;AACnD,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"flow.d.ts","sourceRoot":"","sources":["../../src/actions/flow.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AAC1D,OAAO,KAAK,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AAqCxD,wBAAsB,gBAAgB,CACpC,OAAO,EAAE,UAAU,EACnB,OAAO,EAAE,cAAc,GACtB,OAAO,CAAC,QAAQ,CAAC,CAoBnB"}
|