@apmantza/greedysearch-pi 1.3.0 → 1.4.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +208 -195
- package/cdp.mjs +1 -0
- package/extractors/bing-copilot.mjs +204 -204
- package/extractors/consent.mjs +248 -248
- package/extractors/google-ai.mjs +165 -165
- package/extractors/perplexity.mjs +184 -184
- package/extractors/selectors.mjs +52 -52
- package/index.ts +623 -507
- package/launch.mjs +7 -51
- package/package.json +2 -2
- package/search.mjs +997 -609
- package/skills/greedy-search/SKILL.md +145 -145
- package/test.sh +298 -298
package/extractors/consent.mjs
CHANGED
|
@@ -1,248 +1,248 @@
|
|
|
1
|
-
// consent.mjs — auto-dismiss common cookie/consent banners and human-verification pages
|
|
2
|
-
// Call dismissConsent(tab, cdpFn) after navigating to any page.
|
|
3
|
-
|
|
4
|
-
const CONSENT_JS = `
|
|
5
|
-
(function() {
|
|
6
|
-
// Google consent page (consent.google.com)
|
|
7
|
-
var g = document.querySelector('#L2AGLb, button[jsname="b3VHJd"], .tHlp8d');
|
|
8
|
-
if (g) { g.click(); return 'google'; }
|
|
9
|
-
|
|
10
|
-
// OneTrust (used by many sites including Stack Overflow)
|
|
11
|
-
var ot = document.querySelector('#onetrust-accept-btn-handler, .onetrust-accept-btn-handler');
|
|
12
|
-
if (ot) { ot.click(); return 'onetrust'; }
|
|
13
|
-
|
|
14
|
-
// Generic "accept all" / "agree" buttons
|
|
15
|
-
var btns = Array.from(document.querySelectorAll('button, a[role=button]'));
|
|
16
|
-
var accept = btns.find(b => /^(accept all|accept cookies|agree|i agree|got it|allow all|allow cookies)$/i.test(b.innerText?.trim()));
|
|
17
|
-
if (accept) { accept.click(); return 'generic:' + accept.innerText.trim(); }
|
|
18
|
-
|
|
19
|
-
return null;
|
|
20
|
-
})()
|
|
21
|
-
`;
|
|
22
|
-
|
|
23
|
-
/*
 * In-page script that detects human-verification challenges (Google, Microsoft,
 * Cloudflare) and clicks the first actionable control it finds.
 * handleVerification() passes this string to the cdp 'eval' command.
 *
 * Evaluates to:
 *   'sorry-page'            - Google "sorry" CAPTCHA URL; nothing is clicked
 *   'clicked-<what>[:text]' - a control was clicked (the prefix 'clicked-' is what the caller tests)
 *   null                    - nothing recognised
 *
 * The probes run in a fixed order and the first one that clicks wins.
 */
const VERIFY_DETECT_JS = `
(function() {
  var url = document.location.href;

  // Visible label of a control: trimmed text, falling back to value (for <input type=submit>)
  function labelOf(el) { return el.innerText?.trim() || el.value || ''; }

  // --- Google "sorry" page (hard CAPTCHA, can't auto-solve) ---
  if (url.includes('/sorry/') || url.includes('sorry.google')) return 'sorry-page';

  // --- Microsoft account verification page ---
  if (url.includes('login.microsoftonline.com') || url.includes('login.live.com') || url.includes('account.microsoft.com')) {
    // Look for "Verify" or "Continue" buttons on Microsoft auth pages
    var msBtns = Array.from(document.querySelectorAll('button, input[type=submit], a'));
    var msVerify = msBtns.find(b => /verify|continue|next/i.test(labelOf(b)));
    if (msVerify) { msVerify.click(); return 'clicked-ms-verify:' + labelOf(msVerify); }
  }

  // --- Bing Copilot / Microsoft "Verify you're human" interstitial ---
  // Copilot sometimes shows a modal with "Continue" or "Verify" before allowing queries
  if (url.includes('copilot.microsoft.com') || url.includes('bing.com/chat')) {
    // Look for verification modal/dialog
    var modal = document.querySelector('[role="dialog"], .b_modal, .bnp_hfly, [class*="verify"], [class*="challenge"]');
    if (modal) {
      // Find any actionable button in the modal
      var modalBtns = Array.from(modal.querySelectorAll('button, a[role="button"], input[type="submit"]'));
      var actionBtn = modalBtns.find(b => /^(continue|verify|submit|next|i agree|accept|got it)$/i.test(labelOf(b)));
      // Report the same label that was matched, so submit inputs (no innerText) keep their text
      if (actionBtn) { actionBtn.click(); return 'clicked-copilot-modal:' + labelOf(actionBtn); }
    }

    // Check for Turnstile iframe (Copilot uses Cloudflare Turnstile)
    var copilotIframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"], iframe[title*="challenge"], iframe[title*="Widget"]');
    if (copilotIframe) {
      // Try clicking the iframe container or nearby checkbox
      var container = copilotIframe.closest('[class*="turnstile"], [class*="challenge"], [id*="turnstile"]') || copilotIframe.parentElement;
      if (container) {
        var checkbox = container.querySelector('input[type="checkbox"]');
        if (checkbox && !checkbox.checked) {
          checkbox.click();
          return 'clicked-turnstile-in-iframe';
        }
        // Click the container itself (Turnstile often captures clicks on parent)
        container.click();
        return 'clicked-turnstile-container-near-iframe';
      }
    }
  }

  // --- Cloudflare Turnstile (used by Copilot and many sites) ---
  // Turnstile widget in iframe
  var turnstileIframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"]');
  if (turnstileIframe) {
    // Try to find and click the checkbox inside the iframe's container
    var turnstileCheckbox = document.querySelector('#cf-turnstile-response, [data-turnstile-callback] input, .cf-turnstile input[type="checkbox"]');
    if (turnstileCheckbox && !turnstileCheckbox.checked) {
      turnstileCheckbox.click();
      return 'clicked-turnstile-checkbox';
    }
    // Try clicking the turnstile container itself (some implementations)
    var turnstileContainer = document.querySelector('.cf-turnstile, [data-sitekey]');
    if (turnstileContainer) {
      turnstileContainer.click();
      return 'clicked-turnstile-container';
    }
  }

  // --- Cloudflare "Verify you are human" challenge page ---
  if (url.includes('challenges.cloudflare.com') || document.querySelector('#challenge-running, #challenge-stage')) {
    var cfCheckbox = document.querySelector('#cf-stage input[type="checkbox"], .ctp-checkbox-container input');
    if (cfCheckbox) { cfCheckbox.click(); return 'clicked-cloudflare-checkbox'; }
    var cfBtn = document.querySelector('#challenge-form button, .cf-challenge button');
    if (cfBtn) { cfBtn.click(); return 'clicked-cloudflare-button'; }
  }

  // --- Microsoft "I am human" / "Verify" challenge ---
  // Microsoft uses various verification UIs. Inspect every candidate button, not just the
  // first id match, so an unrelated button earlier in the DOM cannot hide the real one.
  var msHumanBtn = Array.from(document.querySelectorAll('button[id*="i0"], button[id*="id__"]'))
    .find(b => /verify|human|robot|continue/i.test(b.innerText?.trim() || ''));
  if (msHumanBtn) {
    msHumanBtn.click();
    return 'clicked-ms-human:' + msHumanBtn.innerText.trim();
  }

  // --- Generic verification buttons (catch-all) ---
  var btns = Array.from(document.querySelectorAll('button, input[type=submit], a[role=button]'));
  var verify = btns.find(b => /^(verify|verification|verify you are human|i am human|not a robot|continue|proceed)$/i.test(labelOf(b)));
  if (verify && !document.querySelector('iframe[src*="recaptcha"]')) {
    verify.click();
    return 'clicked-verify:' + labelOf(verify);
  }

  // --- Google reCAPTCHA (no image challenge, just checkbox) ---
  var recaptchaCheckbox = document.querySelector('.recaptcha-checkbox-unchecked, input[type=checkbox][id*="recaptcha"]');
  if (recaptchaCheckbox) { recaptchaCheckbox.click(); return 'clicked-recaptcha'; }

  return null;
})()
`;
|
|
118
|
-
|
|
119
|
-
// Retry probe for verification — handleVerification() evaluates this repeatedly (via the
// cdp 'eval' command) until the page clears or its timeout expires. Evaluates to one of:
//   'cleared'                   - URL is not one of the challenge URLs below and none of the
//                                 challenge/dialog selectors match
//   'clicked:<label>'           - clicked a button whose label exactly matches the regex below
//   'clicked-turnstile'         - clicked an unchecked input under #cf-stage / .cf-turnstile
//   'clicked-modal-btn:<label>' - clicked the first button found inside a dialog/modal
//   'still-verifying'           - still on a challenge page but found nothing to click
// NOTE(review): the "still on a verification page" test is narrower than VERIFY_DETECT_JS
// (no sorry.google / login.live.com / account.microsoft.com / Turnstile-iframe checks) and it
// treats any [role="dialog"] element as a challenge — confirm this is intended.
const VERIFY_RETRY_JS = `
(function() {
  var url = document.location.href;

  // Check if we're still on a verification page
  var isVerifyPage = url.includes('/sorry/') ||
    url.includes('challenges.cloudflare.com') ||
    url.includes('login.microsoftonline.com') ||
    document.querySelector('#challenge-running, #challenge-stage, .cf-turnstile, [role="dialog"]');

  if (!isVerifyPage) return 'cleared';

  // Try clicking any verify/continue button again
  var btns = Array.from(document.querySelectorAll('button, input[type=submit], a[role=button]'));
  var btn = btns.find(b => /^(verify|continue|next|i am human|not a robot|submit)$/i.test(b.innerText?.trim() || b.value || ''));
  if (btn) { btn.click(); return 'clicked:' + (btn.innerText?.trim() || btn.value); }

  // Try Turnstile checkbox
  var cf = document.querySelector('#cf-stage input[type="checkbox"], .cf-turnstile input');
  if (cf && !cf.checked) { cf.click(); return 'clicked-turnstile'; }

  // Check for modal dialog with continue button (Copilot interstitial)
  var modal = document.querySelector('[role="dialog"], .b_modal, [class*="verify"]');
  if (modal) {
    var modalBtn = modal.querySelector('button, a[role="button"]');
    if (modalBtn) { modalBtn.click(); return 'clicked-modal-btn:' + modalBtn.innerText.trim(); }
  }

  return 'still-verifying';
})()
`;
|
|
151
|
-
|
|
152
|
-
/**
 * Best-effort dismissal of a cookie/consent banner in the given tab.
 *
 * Evaluates CONSENT_JS through `cdp`; a rejected evaluation is treated the same as
 * "nothing found". When something was clicked, pauses 1.5s before resolving.
 *
 * @param {*} tab - Tab identifier, passed through unchanged to `cdp`.
 * @param {Function} cdp - Called as cdp(['eval', tab, script]); must return a promise.
 * @returns {Promise<void>}
 */
export async function dismissConsent(tab, cdp) {
  const outcome = await cdp(['eval', tab, CONSENT_JS]).catch(() => null);

  const nothingDismissed = !outcome || outcome === 'null';
  if (nothingDismissed) {
    return;
  }

  // Something was clicked: give the page a moment to react
  await new Promise((resolve) => {
    setTimeout(resolve, 1500);
  });
}
|
|
158
|
-
|
|
159
|
-
/*
 * In-page script that locates a Turnstile-looking iframe and returns a viewport click
 * point for coordinate-based clicking (the iframe is cross-origin, so its contents
 * cannot be reached from the page).
 *
 * Evaluates to a JSON string '{"x":<number>,"y":<number>}', or null when no matching
 * iframe exists or the iframe has no visible area.
 * The point is vertically centred and up to 30px in from the left edge, where the
 * checkbox usually is; on iframes narrower than 60px it falls back to the horizontal centre.
 */
const GET_IFRAME_CENTER_JS = `
(function() {
  var iframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"], iframe[title*="challenge"], iframe[title*="Widget"]');
  if (!iframe) return null;
  var rect = iframe.getBoundingClientRect();
  // A hidden or collapsed iframe has no clickable area; a click there would land on something else
  if (!(rect.width > 0) || !(rect.height > 0)) return null;
  // Click near the center-left where the checkbox usually is, without leaving a narrow iframe
  var offsetX = Math.min(30, rect.width / 2);
  return JSON.stringify({ x: rect.left + offsetX, y: rect.top + rect.height / 2 });
})()
`;
|
|
169
|
-
|
|
170
|
-
// Resolve after `ms` milliseconds.
function verifySleep(ms) {
  return new Promise((resolve) => setTimeout(resolve, ms));
}

// True for the Google "sorry" CAPTCHA URLs — same test VERIFY_DETECT_JS uses.
function isGoogleSorryUrl(url) {
  return url.includes('/sorry/') || url.includes('sorry.google');
}

// Click the Turnstile iframe by viewport coordinates; resolves true when a click was sent.
async function clickTurnstileByCoordinates(tab, cdp, isInitialProbe) {
  const raw = await cdp(['eval', tab, GET_IFRAME_CENTER_JS]).catch(() => null);
  if (!raw || raw === 'null') return false;

  if (isInitialProbe) {
    process.stderr.write(`[greedysearch] Found Turnstile iframe, attempting coordinate click...\n`);
  }
  try {
    const { x, y } = JSON.parse(raw);
    if (!isInitialProbe) {
      process.stderr.write(`[greedysearch] Trying coordinate click on Turnstile iframe at (${x}, ${y})...\n`);
    }
    await cdp(['clickxy', tab, String(x), String(y)]);
    await verifySleep(3000);
    return true;
  } catch (err) {
    // Best-effort: report the failure instead of hiding it, then carry on
    const reason = err && err.message ? err.message : String(err);
    process.stderr.write(`[greedysearch] Coordinate click failed: ${reason}\n`);
    return false;
  }
}

// Poll every 2s until the tab leaves the Google "sorry" page or `waitMs` elapses.
async function waitForSorryPageToClear(tab, cdp, waitMs) {
  process.stderr.write(`[greedysearch] Google CAPTCHA detected — please solve it in the browser window (waiting up to ${Math.floor(waitMs / 1000)}s)...\n`);
  const deadline = Date.now() + waitMs;
  while (Date.now() < deadline) {
    await verifySleep(2000);
    const url = await cdp(['eval', tab, 'document.location.href']).catch(() => null);
    // A failed or empty read says nothing about the page; do not mistake it for "solved"
    if (typeof url !== 'string' || url === '' || url === 'null') continue;
    if (!isGoogleSorryUrl(url)) return 'cleared-by-user';
  }
  return 'needs-human';
}

// Re-run VERIFY_RETRY_JS (plus coordinate clicks) until it reports cleared or `waitMs` elapses.
async function retryVerificationUntilCleared(tab, cdp, waitMs) {
  const deadline = Date.now() + waitMs;
  while (Date.now() < deadline) {
    const retryResult = await cdp(['eval', tab, VERIFY_RETRY_JS]).catch(() => null);

    // NOTE(review): a failed evaluation is also treated as "cleared" (kept from the original) —
    // presumably because the page navigated away; confirm.
    if (retryResult === 'cleared' || !retryResult || retryResult === 'null') {
      process.stderr.write(`[greedysearch] Verification cleared.\n`);
      await verifySleep(1000);
      return 'clicked';
    }

    if (typeof retryResult === 'string' && retryResult.startsWith('clicked:')) {
      process.stderr.write(`[greedysearch] Retrying verification click...\n`);
      await verifySleep(2000);
    }

    // If verification is stuck, try clicking the Turnstile iframe by coordinates
    await clickTurnstileByCoordinates(tab, cdp, false);

    await verifySleep(1500);
  }

  // Still stuck — might need user intervention
  process.stderr.write(`[greedysearch] Verification may require manual intervention.\n`);
  return 'needs-human';
}

/**
 * Detect a human-verification challenge in `tab` and try to get past it.
 *
 * Evaluates VERIFY_DETECT_JS in the page, then:
 *  - nothing detected: looks for a Turnstile iframe and, if one is found, clicks it by
 *    coordinates (this fallback used to sit behind an early return and never ran);
 *  - 'sorry-page': polls until the URL leaves the Google CAPTCHA page;
 *  - 'clicked-...': keeps retrying clicks until the page clears or the timeout expires.
 *
 * @param {*} tab - Tab identifier, passed through unchanged to `cdp`.
 * @param {Function} cdp - Called as cdp([command, tab, ...args]) with the 'eval' and 'clickxy'
 *   commands; must return a promise. Results are compared against strings such as 'null'.
 * @param {number} [waitMs=60000] - Upper bound, in ms, for each polling loop.
 * @returns {Promise<string>} 'clear' | 'clicked' | 'cleared-by-user' | 'needs-human'
 */
export async function handleVerification(tab, cdp, waitMs = 60000) {
  const result = await cdp(['eval', tab, VERIFY_DETECT_JS]).catch(() => null);

  // Detection didn't find anything, but check for a Turnstile iframe with coordinates
  if (!result || result === 'null') {
    const clickSent = await clickTurnstileByCoordinates(tab, cdp, true);
    if (clickSent) {
      // Check if it worked
      const state = await cdp(['eval', tab, VERIFY_RETRY_JS]).catch(() => null);
      if (state === 'cleared' || state === 'null') return 'clicked';
    }
    return 'clear';
  }

  // Hard CAPTCHA page — wait for user to solve it manually
  if (result === 'sorry-page') {
    return waitForSorryPageToClear(tab, cdp, waitMs);
  }

  // We clicked something — wait for page to update, then keep retrying
  if (typeof result === 'string' && result.startsWith('clicked-')) {
    process.stderr.write(`[greedysearch] Clicked verification: ${result}\n`);
    await verifySleep(2000);
    return retryVerificationUntilCleared(tab, cdp, waitMs);
  }

  return 'clear';
}
|
|
1
|
+
// consent.mjs — auto-dismiss common cookie/consent banners and human-verification pages
|
|
2
|
+
// Call dismissConsent(tab, cdpFn) after navigating to any page.
|
|
3
|
+
|
|
4
|
+
const CONSENT_JS = `
|
|
5
|
+
(function() {
|
|
6
|
+
// Google consent page (consent.google.com)
|
|
7
|
+
var g = document.querySelector('#L2AGLb, button[jsname="b3VHJd"], .tHlp8d');
|
|
8
|
+
if (g) { g.click(); return 'google'; }
|
|
9
|
+
|
|
10
|
+
// OneTrust (used by many sites including Stack Overflow)
|
|
11
|
+
var ot = document.querySelector('#onetrust-accept-btn-handler, .onetrust-accept-btn-handler');
|
|
12
|
+
if (ot) { ot.click(); return 'onetrust'; }
|
|
13
|
+
|
|
14
|
+
// Generic "accept all" / "agree" buttons
|
|
15
|
+
var btns = Array.from(document.querySelectorAll('button, a[role=button]'));
|
|
16
|
+
var accept = btns.find(b => /^(accept all|accept cookies|agree|i agree|got it|allow all|allow cookies)$/i.test(b.innerText?.trim()));
|
|
17
|
+
if (accept) { accept.click(); return 'generic:' + accept.innerText.trim(); }
|
|
18
|
+
|
|
19
|
+
return null;
|
|
20
|
+
})()
|
|
21
|
+
`;
|
|
22
|
+
|
|
23
|
+
/*
 * In-page script that detects human-verification challenges (Google, Microsoft,
 * Cloudflare) and clicks the first actionable control it finds.
 * handleVerification() passes this string to the cdp 'eval' command.
 *
 * Evaluates to:
 *   'sorry-page'            - Google "sorry" CAPTCHA URL; nothing is clicked
 *   'clicked-<what>[:text]' - a control was clicked (the prefix 'clicked-' is what the caller tests)
 *   null                    - nothing recognised
 *
 * The probes run in a fixed order and the first one that clicks wins.
 */
const VERIFY_DETECT_JS = `
(function() {
  var url = document.location.href;

  // Visible label of a control: trimmed text, falling back to value (for <input type=submit>)
  function labelOf(el) { return el.innerText?.trim() || el.value || ''; }

  // --- Google "sorry" page (hard CAPTCHA, can't auto-solve) ---
  if (url.includes('/sorry/') || url.includes('sorry.google')) return 'sorry-page';

  // --- Microsoft account verification page ---
  if (url.includes('login.microsoftonline.com') || url.includes('login.live.com') || url.includes('account.microsoft.com')) {
    // Look for "Verify" or "Continue" buttons on Microsoft auth pages
    var msBtns = Array.from(document.querySelectorAll('button, input[type=submit], a'));
    var msVerify = msBtns.find(b => /verify|continue|next/i.test(labelOf(b)));
    if (msVerify) { msVerify.click(); return 'clicked-ms-verify:' + labelOf(msVerify); }
  }

  // --- Bing Copilot / Microsoft "Verify you're human" interstitial ---
  // Copilot sometimes shows a modal with "Continue" or "Verify" before allowing queries
  if (url.includes('copilot.microsoft.com') || url.includes('bing.com/chat')) {
    // Look for verification modal/dialog
    var modal = document.querySelector('[role="dialog"], .b_modal, .bnp_hfly, [class*="verify"], [class*="challenge"]');
    if (modal) {
      // Find any actionable button in the modal
      var modalBtns = Array.from(modal.querySelectorAll('button, a[role="button"], input[type="submit"]'));
      var actionBtn = modalBtns.find(b => /^(continue|verify|submit|next|i agree|accept|got it)$/i.test(labelOf(b)));
      // Report the same label that was matched, so submit inputs (no innerText) keep their text
      if (actionBtn) { actionBtn.click(); return 'clicked-copilot-modal:' + labelOf(actionBtn); }
    }

    // Check for Turnstile iframe (Copilot uses Cloudflare Turnstile)
    var copilotIframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"], iframe[title*="challenge"], iframe[title*="Widget"]');
    if (copilotIframe) {
      // Try clicking the iframe container or nearby checkbox
      var container = copilotIframe.closest('[class*="turnstile"], [class*="challenge"], [id*="turnstile"]') || copilotIframe.parentElement;
      if (container) {
        var checkbox = container.querySelector('input[type="checkbox"]');
        if (checkbox && !checkbox.checked) {
          checkbox.click();
          return 'clicked-turnstile-in-iframe';
        }
        // Click the container itself (Turnstile often captures clicks on parent)
        container.click();
        return 'clicked-turnstile-container-near-iframe';
      }
    }
  }

  // --- Cloudflare Turnstile (used by Copilot and many sites) ---
  // Turnstile widget in iframe
  var turnstileIframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"]');
  if (turnstileIframe) {
    // Try to find and click the checkbox inside the iframe's container
    var turnstileCheckbox = document.querySelector('#cf-turnstile-response, [data-turnstile-callback] input, .cf-turnstile input[type="checkbox"]');
    if (turnstileCheckbox && !turnstileCheckbox.checked) {
      turnstileCheckbox.click();
      return 'clicked-turnstile-checkbox';
    }
    // Try clicking the turnstile container itself (some implementations)
    var turnstileContainer = document.querySelector('.cf-turnstile, [data-sitekey]');
    if (turnstileContainer) {
      turnstileContainer.click();
      return 'clicked-turnstile-container';
    }
  }

  // --- Cloudflare "Verify you are human" challenge page ---
  if (url.includes('challenges.cloudflare.com') || document.querySelector('#challenge-running, #challenge-stage')) {
    var cfCheckbox = document.querySelector('#cf-stage input[type="checkbox"], .ctp-checkbox-container input');
    if (cfCheckbox) { cfCheckbox.click(); return 'clicked-cloudflare-checkbox'; }
    var cfBtn = document.querySelector('#challenge-form button, .cf-challenge button');
    if (cfBtn) { cfBtn.click(); return 'clicked-cloudflare-button'; }
  }

  // --- Microsoft "I am human" / "Verify" challenge ---
  // Microsoft uses various verification UIs. Inspect every candidate button, not just the
  // first id match, so an unrelated button earlier in the DOM cannot hide the real one.
  var msHumanBtn = Array.from(document.querySelectorAll('button[id*="i0"], button[id*="id__"]'))
    .find(b => /verify|human|robot|continue/i.test(b.innerText?.trim() || ''));
  if (msHumanBtn) {
    msHumanBtn.click();
    return 'clicked-ms-human:' + msHumanBtn.innerText.trim();
  }

  // --- Generic verification buttons (catch-all) ---
  var btns = Array.from(document.querySelectorAll('button, input[type=submit], a[role=button]'));
  var verify = btns.find(b => /^(verify|verification|verify you are human|i am human|not a robot|continue|proceed)$/i.test(labelOf(b)));
  if (verify && !document.querySelector('iframe[src*="recaptcha"]')) {
    verify.click();
    return 'clicked-verify:' + labelOf(verify);
  }

  // --- Google reCAPTCHA (no image challenge, just checkbox) ---
  var recaptchaCheckbox = document.querySelector('.recaptcha-checkbox-unchecked, input[type=checkbox][id*="recaptcha"]');
  if (recaptchaCheckbox) { recaptchaCheckbox.click(); return 'clicked-recaptcha'; }

  return null;
})()
`;
|
|
118
|
+
|
|
119
|
+
// Retry probe for verification — handleVerification() evaluates this repeatedly (via the
// cdp 'eval' command) until the page clears or its timeout expires. Evaluates to one of:
//   'cleared'                   - URL is not one of the challenge URLs below and none of the
//                                 challenge/dialog selectors match
//   'clicked:<label>'           - clicked a button whose label exactly matches the regex below
//   'clicked-turnstile'         - clicked an unchecked input under #cf-stage / .cf-turnstile
//   'clicked-modal-btn:<label>' - clicked the first button found inside a dialog/modal
//   'still-verifying'           - still on a challenge page but found nothing to click
// NOTE(review): the "still on a verification page" test is narrower than VERIFY_DETECT_JS
// (no sorry.google / login.live.com / account.microsoft.com / Turnstile-iframe checks) and it
// treats any [role="dialog"] element as a challenge — confirm this is intended.
const VERIFY_RETRY_JS = `
(function() {
  var url = document.location.href;

  // Check if we're still on a verification page
  var isVerifyPage = url.includes('/sorry/') ||
    url.includes('challenges.cloudflare.com') ||
    url.includes('login.microsoftonline.com') ||
    document.querySelector('#challenge-running, #challenge-stage, .cf-turnstile, [role="dialog"]');

  if (!isVerifyPage) return 'cleared';

  // Try clicking any verify/continue button again
  var btns = Array.from(document.querySelectorAll('button, input[type=submit], a[role=button]'));
  var btn = btns.find(b => /^(verify|continue|next|i am human|not a robot|submit)$/i.test(b.innerText?.trim() || b.value || ''));
  if (btn) { btn.click(); return 'clicked:' + (btn.innerText?.trim() || btn.value); }

  // Try Turnstile checkbox
  var cf = document.querySelector('#cf-stage input[type="checkbox"], .cf-turnstile input');
  if (cf && !cf.checked) { cf.click(); return 'clicked-turnstile'; }

  // Check for modal dialog with continue button (Copilot interstitial)
  var modal = document.querySelector('[role="dialog"], .b_modal, [class*="verify"]');
  if (modal) {
    var modalBtn = modal.querySelector('button, a[role="button"]');
    if (modalBtn) { modalBtn.click(); return 'clicked-modal-btn:' + modalBtn.innerText.trim(); }
  }

  return 'still-verifying';
})()
`;
|
|
151
|
+
|
|
152
|
+
/**
 * Best-effort dismissal of a cookie/consent banner in the given tab.
 *
 * Evaluates CONSENT_JS through `cdp`; a rejected evaluation is treated the same as
 * "nothing found". When something was clicked, pauses 1.5s before resolving.
 *
 * @param {*} tab - Tab identifier, passed through unchanged to `cdp`.
 * @param {Function} cdp - Called as cdp(['eval', tab, script]); must return a promise.
 * @returns {Promise<void>}
 */
export async function dismissConsent(tab, cdp) {
  const outcome = await cdp(['eval', tab, CONSENT_JS]).catch(() => null);

  const nothingDismissed = !outcome || outcome === 'null';
  if (nothingDismissed) {
    return;
  }

  // Something was clicked: give the page a moment to react
  await new Promise((resolve) => {
    setTimeout(resolve, 1500);
  });
}
|
|
158
|
+
|
|
159
|
+
/*
 * In-page script that locates a Turnstile-looking iframe and returns a viewport click
 * point for coordinate-based clicking (the iframe is cross-origin, so its contents
 * cannot be reached from the page).
 *
 * Evaluates to a JSON string '{"x":<number>,"y":<number>}', or null when no matching
 * iframe exists or the iframe has no visible area.
 * The point is vertically centred and up to 30px in from the left edge, where the
 * checkbox usually is; on iframes narrower than 60px it falls back to the horizontal centre.
 */
const GET_IFRAME_CENTER_JS = `
(function() {
  var iframe = document.querySelector('iframe[src*="challenges.cloudflare.com"], iframe[src*="turnstile"], iframe[title*="challenge"], iframe[title*="Widget"]');
  if (!iframe) return null;
  var rect = iframe.getBoundingClientRect();
  // A hidden or collapsed iframe has no clickable area; a click there would land on something else
  if (!(rect.width > 0) || !(rect.height > 0)) return null;
  // Click near the center-left where the checkbox usually is, without leaving a narrow iframe
  var offsetX = Math.min(30, rect.width / 2);
  return JSON.stringify({ x: rect.left + offsetX, y: rect.top + rect.height / 2 });
})()
`;
|
|
169
|
+
|
|
170
|
+
// Resolve after `ms` milliseconds.
function verifySleep(ms) {
  return new Promise((resolve) => setTimeout(resolve, ms));
}

// True for the Google "sorry" CAPTCHA URLs — same test VERIFY_DETECT_JS uses.
function isGoogleSorryUrl(url) {
  return url.includes('/sorry/') || url.includes('sorry.google');
}

// Click the Turnstile iframe by viewport coordinates; resolves true when a click was sent.
async function clickTurnstileByCoordinates(tab, cdp, isInitialProbe) {
  const raw = await cdp(['eval', tab, GET_IFRAME_CENTER_JS]).catch(() => null);
  if (!raw || raw === 'null') return false;

  if (isInitialProbe) {
    process.stderr.write(`[greedysearch] Found Turnstile iframe, attempting coordinate click...\n`);
  }
  try {
    const { x, y } = JSON.parse(raw);
    if (!isInitialProbe) {
      process.stderr.write(`[greedysearch] Trying coordinate click on Turnstile iframe at (${x}, ${y})...\n`);
    }
    await cdp(['clickxy', tab, String(x), String(y)]);
    await verifySleep(3000);
    return true;
  } catch (err) {
    // Best-effort: report the failure instead of hiding it, then carry on
    const reason = err && err.message ? err.message : String(err);
    process.stderr.write(`[greedysearch] Coordinate click failed: ${reason}\n`);
    return false;
  }
}

// Poll every 2s until the tab leaves the Google "sorry" page or `waitMs` elapses.
async function waitForSorryPageToClear(tab, cdp, waitMs) {
  process.stderr.write(`[greedysearch] Google CAPTCHA detected — please solve it in the browser window (waiting up to ${Math.floor(waitMs / 1000)}s)...\n`);
  const deadline = Date.now() + waitMs;
  while (Date.now() < deadline) {
    await verifySleep(2000);
    const url = await cdp(['eval', tab, 'document.location.href']).catch(() => null);
    // A failed or empty read says nothing about the page; do not mistake it for "solved"
    if (typeof url !== 'string' || url === '' || url === 'null') continue;
    if (!isGoogleSorryUrl(url)) return 'cleared-by-user';
  }
  return 'needs-human';
}

// Re-run VERIFY_RETRY_JS (plus coordinate clicks) until it reports cleared or `waitMs` elapses.
async function retryVerificationUntilCleared(tab, cdp, waitMs) {
  const deadline = Date.now() + waitMs;
  while (Date.now() < deadline) {
    const retryResult = await cdp(['eval', tab, VERIFY_RETRY_JS]).catch(() => null);

    // NOTE(review): a failed evaluation is also treated as "cleared" (kept from the original) —
    // presumably because the page navigated away; confirm.
    if (retryResult === 'cleared' || !retryResult || retryResult === 'null') {
      process.stderr.write(`[greedysearch] Verification cleared.\n`);
      await verifySleep(1000);
      return 'clicked';
    }

    if (typeof retryResult === 'string' && retryResult.startsWith('clicked:')) {
      process.stderr.write(`[greedysearch] Retrying verification click...\n`);
      await verifySleep(2000);
    }

    // If verification is stuck, try clicking the Turnstile iframe by coordinates
    await clickTurnstileByCoordinates(tab, cdp, false);

    await verifySleep(1500);
  }

  // Still stuck — might need user intervention
  process.stderr.write(`[greedysearch] Verification may require manual intervention.\n`);
  return 'needs-human';
}

/**
 * Detect a human-verification challenge in `tab` and try to get past it.
 *
 * Evaluates VERIFY_DETECT_JS in the page, then:
 *  - nothing detected: looks for a Turnstile iframe and, if one is found, clicks it by
 *    coordinates (this fallback used to sit behind an early return and never ran);
 *  - 'sorry-page': polls until the URL leaves the Google CAPTCHA page;
 *  - 'clicked-...': keeps retrying clicks until the page clears or the timeout expires.
 *
 * @param {*} tab - Tab identifier, passed through unchanged to `cdp`.
 * @param {Function} cdp - Called as cdp([command, tab, ...args]) with the 'eval' and 'clickxy'
 *   commands; must return a promise. Results are compared against strings such as 'null'.
 * @param {number} [waitMs=60000] - Upper bound, in ms, for each polling loop.
 * @returns {Promise<string>} 'clear' | 'clicked' | 'cleared-by-user' | 'needs-human'
 */
export async function handleVerification(tab, cdp, waitMs = 60000) {
  const result = await cdp(['eval', tab, VERIFY_DETECT_JS]).catch(() => null);

  // Detection didn't find anything, but check for a Turnstile iframe with coordinates
  if (!result || result === 'null') {
    const clickSent = await clickTurnstileByCoordinates(tab, cdp, true);
    if (clickSent) {
      // Check if it worked
      const state = await cdp(['eval', tab, VERIFY_RETRY_JS]).catch(() => null);
      if (state === 'cleared' || state === 'null') return 'clicked';
    }
    return 'clear';
  }

  // Hard CAPTCHA page — wait for user to solve it manually
  if (result === 'sorry-page') {
    return waitForSorryPageToClear(tab, cdp, waitMs);
  }

  // We clicked something — wait for page to update, then keep retrying
  if (typeof result === 'string' && result.startsWith('clicked-')) {
    process.stderr.write(`[greedysearch] Clicked verification: ${result}\n`);
    await verifySleep(2000);
    return retryVerificationUntilCleared(tab, cdp, waitMs);
  }

  return 'clear';
}
|