web-agent-bridge 3.0.0 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (202) hide show
  1. package/LICENSE +72 -21
  2. package/README.ar.md +1286 -1073
  3. package/README.md +1764 -1535
  4. package/bin/agent-runner.js +474 -474
  5. package/bin/cli.js +237 -138
  6. package/bin/wab.js +80 -80
  7. package/examples/bidi-agent.js +119 -119
  8. package/examples/cross-site-agent.js +91 -91
  9. package/examples/mcp-agent.js +94 -94
  10. package/examples/next-app-router/README.md +44 -44
  11. package/examples/puppeteer-agent.js +108 -108
  12. package/examples/saas-dashboard/README.md +55 -55
  13. package/examples/shopify-hydrogen/README.md +74 -74
  14. package/examples/vision-agent.js +171 -171
  15. package/examples/wordpress-elementor/README.md +77 -77
  16. package/package.json +17 -3
  17. package/public/.well-known/agent-tools.json +180 -180
  18. package/public/.well-known/ai-assets.json +59 -59
  19. package/public/.well-known/ai-plugin.json +28 -0
  20. package/public/.well-known/security.txt +8 -0
  21. package/public/agent-workspace.html +349 -347
  22. package/public/ai.html +198 -196
  23. package/public/api.html +413 -0
  24. package/public/browser.html +486 -484
  25. package/public/commander-dashboard.html +243 -243
  26. package/public/cookies.html +210 -208
  27. package/public/css/agent-workspace.css +1713 -1713
  28. package/public/css/premium.css +317 -317
  29. package/public/css/styles.css +1235 -1235
  30. package/public/dashboard.html +706 -704
  31. package/public/demo.html +1770 -1
  32. package/public/dns.html +507 -0
  33. package/public/docs.html +587 -585
  34. package/public/feed.xml +89 -89
  35. package/public/growth.html +463 -0
  36. package/public/index.html +341 -9
  37. package/public/integrations.html +556 -0
  38. package/public/js/agent-workspace.js +1740 -1740
  39. package/public/js/auth-nav.js +31 -31
  40. package/public/js/auth-redirect.js +12 -12
  41. package/public/js/cookie-consent.js +56 -56
  42. package/public/js/wab-demo-page.js +721 -721
  43. package/public/js/ws-client.js +74 -74
  44. package/public/llms-full.txt +360 -309
  45. package/public/llms.txt +125 -86
  46. package/public/login.html +85 -83
  47. package/public/mesh-dashboard.html +328 -328
  48. package/public/openapi.json +580 -580
  49. package/public/phone-shield.html +281 -0
  50. package/public/premium-dashboard.html +2489 -2487
  51. package/public/premium.html +793 -791
  52. package/public/privacy.html +297 -295
  53. package/public/register.html +105 -103
  54. package/public/robots.txt +87 -87
  55. package/public/script/wab-consent.d.ts +36 -36
  56. package/public/script/wab-consent.js +104 -104
  57. package/public/script/wab-schema.js +131 -131
  58. package/public/script/wab.d.ts +108 -108
  59. package/public/script/wab.min.js +580 -580
  60. package/public/security.txt +8 -0
  61. package/public/terms.html +256 -254
  62. package/script/ai-agent-bridge.js +1754 -1754
  63. package/sdk/README.md +99 -99
  64. package/sdk/agent-mesh.js +449 -449
  65. package/sdk/commander.js +262 -262
  66. package/sdk/index.d.ts +464 -464
  67. package/sdk/index.js +18 -1
  68. package/sdk/multi-agent.js +318 -318
  69. package/sdk/package.json +12 -1
  70. package/sdk/safety-shield.js +219 -0
  71. package/sdk/schema-discovery.js +83 -83
  72. package/server/adapters/index.js +520 -520
  73. package/server/config/plans.js +367 -367
  74. package/server/config/secrets.js +102 -102
  75. package/server/control-plane/index.js +301 -301
  76. package/server/data-plane/index.js +354 -354
  77. package/server/index.js +175 -19
  78. package/server/llm/index.js +404 -404
  79. package/server/middleware/adminAuth.js +35 -35
  80. package/server/middleware/auth.js +50 -50
  81. package/server/middleware/featureGate.js +88 -88
  82. package/server/middleware/rateLimits.js +100 -100
  83. package/server/middleware/sensitiveAction.js +157 -0
  84. package/server/migrations/001_add_analytics_indexes.sql +7 -7
  85. package/server/migrations/002_premium_features.sql +418 -418
  86. package/server/migrations/003_ads_integer_cents.sql +33 -33
  87. package/server/migrations/004_agent_os.sql +158 -158
  88. package/server/migrations/005_marketplace_metering.sql +126 -126
  89. package/server/models/adapters/index.js +33 -33
  90. package/server/models/adapters/mysql.js +183 -183
  91. package/server/models/adapters/postgresql.js +172 -172
  92. package/server/models/adapters/sqlite.js +7 -7
  93. package/server/models/db.js +681 -681
  94. package/server/observability/failure-analysis.js +337 -337
  95. package/server/observability/index.js +394 -394
  96. package/server/protocol/capabilities.js +223 -223
  97. package/server/protocol/index.js +243 -243
  98. package/server/protocol/schema.js +584 -584
  99. package/server/registry/certification.js +271 -271
  100. package/server/registry/index.js +326 -326
  101. package/server/routes/admin-premium.js +671 -671
  102. package/server/routes/admin.js +261 -261
  103. package/server/routes/ads.js +130 -130
  104. package/server/routes/agent-workspace.js +540 -378
  105. package/server/routes/api.js +150 -150
  106. package/server/routes/auth.js +71 -71
  107. package/server/routes/billing.js +45 -45
  108. package/server/routes/commander.js +316 -316
  109. package/server/routes/demo-showcase.js +332 -0
  110. package/server/routes/demo-store.js +154 -0
  111. package/server/routes/discovery.js +417 -406
  112. package/server/routes/gateway.js +173 -0
  113. package/server/routes/license.js +251 -240
  114. package/server/routes/mesh.js +469 -469
  115. package/server/routes/noscript.js +543 -543
  116. package/server/routes/premium-v2.js +686 -686
  117. package/server/routes/premium.js +724 -724
  118. package/server/routes/runtime.js +2148 -2147
  119. package/server/routes/sovereign.js +465 -385
  120. package/server/routes/universal.js +200 -177
  121. package/server/routes/wab-api.js +850 -491
  122. package/server/runtime/container-worker.js +111 -111
  123. package/server/runtime/container.js +448 -448
  124. package/server/runtime/distributed-worker.js +362 -362
  125. package/server/runtime/event-bus.js +210 -210
  126. package/server/runtime/index.js +253 -253
  127. package/server/runtime/queue.js +599 -599
  128. package/server/runtime/replay.js +666 -666
  129. package/server/runtime/sandbox.js +266 -266
  130. package/server/runtime/scheduler.js +534 -534
  131. package/server/runtime/session-engine.js +293 -293
  132. package/server/runtime/state-manager.js +188 -188
  133. package/server/security/cross-site-redactor.js +196 -0
  134. package/server/security/dry-run.js +180 -0
  135. package/server/security/human-gate-rate-limit.js +147 -0
  136. package/server/security/human-gate-transports.js +178 -0
  137. package/server/security/human-gate.js +281 -0
  138. package/server/security/index.js +368 -368
  139. package/server/security/intent-engine.js +245 -0
  140. package/server/security/reward-guard.js +171 -0
  141. package/server/security/rollback-store.js +239 -0
  142. package/server/security/token-scope.js +404 -0
  143. package/server/security/url-policy.js +139 -0
  144. package/server/services/agent-chat.js +506 -506
  145. package/server/services/agent-learning.js +601 -575
  146. package/server/services/agent-memory.js +625 -625
  147. package/server/services/agent-mesh.js +555 -539
  148. package/server/services/agent-symphony.js +717 -717
  149. package/server/services/agent-tasks.js +1807 -1807
  150. package/server/services/api-key-engine.js +292 -0
  151. package/server/services/cluster.js +894 -894
  152. package/server/services/commander.js +738 -738
  153. package/server/services/edge-compute.js +440 -440
  154. package/server/services/email.js +204 -204
  155. package/server/services/hosted-runtime.js +205 -205
  156. package/server/services/lfd.js +635 -616
  157. package/server/services/local-ai.js +389 -389
  158. package/server/services/marketplace.js +270 -270
  159. package/server/services/metering.js +182 -182
  160. package/server/services/modules/affiliate-intelligence.js +93 -0
  161. package/server/services/modules/agent-firewall.js +90 -0
  162. package/server/services/modules/bounty.js +89 -0
  163. package/server/services/modules/collective-bargaining.js +92 -0
  164. package/server/services/modules/dark-pattern.js +66 -0
  165. package/server/services/modules/gov-intelligence.js +45 -0
  166. package/server/services/modules/neural.js +55 -0
  167. package/server/services/modules/notary.js +49 -0
  168. package/server/services/modules/price-time-machine.js +86 -0
  169. package/server/services/modules/protocol.js +104 -0
  170. package/server/services/negotiation.js +439 -439
  171. package/server/services/plugins.js +771 -771
  172. package/server/services/premium.js +1 -1
  173. package/server/services/price-intelligence.js +566 -565
  174. package/server/services/price-shield.js +1137 -1137
  175. package/server/services/reputation.js +465 -465
  176. package/server/services/search-engine.js +357 -357
  177. package/server/services/security.js +513 -513
  178. package/server/services/self-healing.js +843 -843
  179. package/server/services/sovereign-shield.js +542 -0
  180. package/server/services/stripe.js +192 -192
  181. package/server/services/swarm.js +788 -788
  182. package/server/services/universal-scraper.js +662 -661
  183. package/server/services/verification.js +481 -481
  184. package/server/services/vision.js +1163 -1163
  185. package/server/utils/cache.js +125 -125
  186. package/server/utils/migrate.js +81 -81
  187. package/server/utils/safe-fetch.js +228 -0
  188. package/server/utils/secureFields.js +50 -50
  189. package/server/ws.js +161 -161
  190. package/templates/artisan-marketplace.yaml +104 -104
  191. package/templates/book-price-scout.yaml +98 -98
  192. package/templates/electronics-price-tracker.yaml +108 -108
  193. package/templates/flight-deal-hunter.yaml +113 -113
  194. package/templates/freelancer-direct.yaml +116 -116
  195. package/templates/grocery-price-compare.yaml +93 -93
  196. package/templates/hotel-direct-booking.yaml +113 -113
  197. package/templates/local-services.yaml +98 -98
  198. package/templates/olive-oil-tunisia.yaml +88 -88
  199. package/templates/organic-farm-fresh.yaml +101 -101
  200. package/templates/restaurant-direct.yaml +97 -97
  201. package/server/services/fairness-engine.js +0 -409
  202. package/server/services/fairness.js +0 -420
@@ -1,357 +1,357 @@
1
- /**
2
- * WAB Search Engine — Independent search aggregator with caching,
3
- * ranking, suggestions, and trending queries.
4
- *
5
- * All results are served under the WAB brand — no external engine
6
- * branding is ever exposed to the user.
7
- */
8
-
9
- const crypto = require('crypto');
10
-
11
- let db;
12
-
13
- function initSearchEngine(database) {
14
- db = database;
15
-
16
- db.exec(`
17
- CREATE TABLE IF NOT EXISTS search_cache (
18
- query_hash TEXT PRIMARY KEY,
19
- query TEXT NOT NULL,
20
- results TEXT NOT NULL,
21
- source TEXT DEFAULT 'multi',
22
- created_at TEXT DEFAULT (datetime('now')),
23
- hit_count INTEGER DEFAULT 1
24
- );
25
-
26
- CREATE TABLE IF NOT EXISTS search_history (
27
- id INTEGER PRIMARY KEY AUTOINCREMENT,
28
- query TEXT NOT NULL,
29
- ip_hash TEXT,
30
- results_count INTEGER DEFAULT 0,
31
- created_at TEXT DEFAULT (datetime('now'))
32
- );
33
-
34
- CREATE TABLE IF NOT EXISTS search_suggestions (
35
- query TEXT PRIMARY KEY,
36
- frequency INTEGER DEFAULT 1,
37
- last_searched TEXT DEFAULT (datetime('now'))
38
- );
39
-
40
- CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
- CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
- CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
- `);
44
- }
45
-
46
- // ─── Cache Layer ──────────────────────────────────────────────────────
47
-
48
- function queryHash(q) {
49
- return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
- }
51
-
52
- function getCachedResults(query) {
53
- const hash = queryHash(query);
54
- const row = db.prepare(
55
- `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
- ).get(hash);
57
- if (row) {
58
- db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
- return JSON.parse(row.results);
60
- }
61
- return null;
62
- }
63
-
64
- function setCachedResults(query, results, source) {
65
- const hash = queryHash(query);
66
- db.prepare(
67
- `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
- VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
- ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
- }
71
-
72
- // Purge old cache entries (>24h)
73
- function purgeOldCache() {
74
- db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
- }
76
-
77
- // ─── Search History & Suggestions ─────────────────────────────────────
78
-
79
- function recordSearch(query, ipHash, resultsCount) {
80
- db.prepare(
81
- `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
- ).run(query.trim(), ipHash || null, resultsCount);
83
-
84
- // Update suggestion frequency
85
- const normalized = query.toLowerCase().trim();
86
- if (normalized.length >= 2 && normalized.length <= 100) {
87
- const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
- if (existing) {
89
- db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
- } else {
91
- db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
- }
93
- }
94
- }
95
-
96
- function getSuggestions(prefix, limit = 8) {
97
- if (!prefix || prefix.length < 1) return [];
98
- const normalized = prefix.toLowerCase().trim();
99
- return db.prepare(
100
- `SELECT query, frequency FROM search_suggestions
101
- WHERE query LIKE ? AND frequency > 0
102
- ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
- ).all(normalized + '%', limit).map(r => r.query);
104
- }
105
-
106
- function getTrendingSearches(limit = 10) {
107
- return db.prepare(
108
- `SELECT query, COUNT(*) as count FROM search_history
109
- WHERE created_at > datetime('now', '-24 hours')
110
- GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
- ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
- }
113
-
114
- function getSearchStats() {
115
- const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
- const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
- const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
- const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
- return { total, today, cached, uniqueQueries };
120
- }
121
-
122
- // ─── Multi-Source Search ──────────────────────────────────────────────
123
-
124
- const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
- const HEADERS = {
126
- 'User-Agent': UA,
127
- 'Accept': 'text/html',
128
- 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
- };
130
-
131
- async function searchDDG(q) {
132
- try {
133
- const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
134
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
135
- const html = await resp.text();
136
- const results = [];
137
- const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
138
- const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
139
- const urls = [], titles = [], snippets = [];
140
- let m;
141
- while ((m = resultPattern.exec(html)) !== null) {
142
- urls.push(m[1]);
143
- titles.push(stripHtml(m[2]));
144
- }
145
- while ((m = snippetPattern.exec(html)) !== null) {
146
- snippets.push(decodeEntities(stripHtml(m[1])));
147
- }
148
- for (let i = 0; i < Math.min(urls.length, 15); i++) {
149
- let u = urls[i];
150
- const uddg = u.match(/uddg=([^&]+)/);
151
- if (uddg) u = decodeURIComponent(uddg[1]);
152
- if (!u.startsWith('http')) continue;
153
- results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
154
- }
155
- return results;
156
- } catch (e) {
157
- return [];
158
- }
159
- }
160
-
161
- async function searchGoogle(q) {
162
- try {
163
- const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
164
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
165
- const html = await resp.text();
166
- const results = [];
167
- const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
168
- let m;
169
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
170
- const u = decodeURIComponent(m[1]);
171
- if (!u.startsWith('http')) continue;
172
- try { if (new URL(u).hostname.includes('google.')) continue; } catch { continue; }
173
- const title = stripHtml(m[2]);
174
- if (!title) continue;
175
- results.push({ title, url: u, snippet: '', source: 'google' });
176
- }
177
- return results;
178
- } catch (e) {
179
- return [];
180
- }
181
- }
182
-
183
- async function searchBing(q) {
184
- try {
185
- const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
186
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
187
- const html = await resp.text();
188
- const results = [];
189
- // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
190
- const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
191
- let m;
192
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
193
- const u = m[1];
194
- if (!u.startsWith('http')) continue;
195
- try { if (new URL(u).hostname.includes('bing.')) continue; } catch { continue; }
196
- const title = stripHtml(m[2]);
197
- const snippet = decodeEntities(stripHtml(m[3]));
198
- if (!title) continue;
199
- results.push({ title, url: u, snippet, source: 'bing' });
200
- }
201
- return results;
202
- } catch (e) {
203
- return [];
204
- }
205
- }
206
-
207
- // ─── Result Ranking Engine ────────────────────────────────────────────
208
-
209
- function rankResults(allResults) {
210
- // Deduplicate by URL (keep the one with the best snippet)
211
- const seen = new Map();
212
- for (const r of allResults) {
213
- const normalizedUrl = normalizeUrl(r.url);
214
- const existing = seen.get(normalizedUrl);
215
- if (!existing) {
216
- seen.set(normalizedUrl, { ...r, sourceCount: 1 });
217
- } else {
218
- existing.sourceCount++;
219
- // Prefer the version with a snippet
220
- if (!existing.snippet && r.snippet) {
221
- existing.snippet = r.snippet;
222
- }
223
- // Prefer longer title
224
- if (r.title.length > existing.title.length) {
225
- existing.title = r.title;
226
- }
227
- }
228
- }
229
-
230
- const deduplicated = Array.from(seen.values());
231
-
232
- // Score each result
233
- for (const r of deduplicated) {
234
- let score = 0;
235
-
236
- // Multi-source bonus: appearing in multiple engines means higher relevance
237
- score += (r.sourceCount - 1) * 30;
238
-
239
- // Snippet presence
240
- if (r.snippet && r.snippet.length > 20) score += 15;
241
-
242
- // HTTPS bonus
243
- if (r.url.startsWith('https://')) score += 5;
244
-
245
- // Domain diversity: boost independent/small sites
246
- const hostname = safeHostname(r.url);
247
- const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
248
- const isBigTech = bigTech.some(d => hostname === d || hostname.endsWith('.' + d));
249
- if (!isBigTech) score += 8;
250
-
251
- // Trusted TLDs
252
- const tld = hostname.split('.').pop();
253
- if (['org','edu','gov','dev'].includes(tld)) score += 5;
254
-
255
- // Penalize very long URLs (likely junk)
256
- if (r.url.length > 200) score -= 10;
257
-
258
- r.score = score;
259
- }
260
-
261
- // Sort by score descending, then by original order
262
- deduplicated.sort((a, b) => b.score - a.score);
263
-
264
- // Return top 15, strip internal fields
265
- return deduplicated.slice(0, 15).map(r => ({
266
- title: r.title,
267
- url: r.url,
268
- snippet: r.snippet || '',
269
- }));
270
- }
271
-
272
- // ─── Main Search Function ─────────────────────────────────────────────
273
-
274
- async function search(query, ipHash) {
275
- if (!query || !query.trim()) return { results: [], cached: false };
276
-
277
- const q = query.trim();
278
-
279
- // Check cache first
280
- const cached = getCachedResults(q);
281
- if (cached && cached.length > 0) {
282
- recordSearch(q, ipHash, cached.length);
283
- return { results: cached, cached: true };
284
- }
285
-
286
- // Fetch from all sources in parallel
287
- const [ddgResults, googleResults, bingResults] = await Promise.allSettled([
288
- searchDDG(q),
289
- searchGoogle(q),
290
- searchBing(q),
291
- ]);
292
-
293
- const allResults = [
294
- ...(ddgResults.status === 'fulfilled' ? ddgResults.value : []),
295
- ...(googleResults.status === 'fulfilled' ? googleResults.value : []),
296
- ...(bingResults.status === 'fulfilled' ? bingResults.value : []),
297
- ];
298
-
299
- if (allResults.length === 0) {
300
- recordSearch(q, ipHash, 0);
301
- return { results: [], cached: false };
302
- }
303
-
304
- // Rank and deduplicate
305
- const ranked = rankResults(allResults);
306
-
307
- // Cache results
308
- setCachedResults(q, ranked, 'multi');
309
-
310
- // Record search
311
- recordSearch(q, ipHash, ranked.length);
312
-
313
- return { results: ranked, cached: false };
314
- }
315
-
316
- // ─── Helpers ──────────────────────────────────────────────────────────
317
-
318
- function stripHtml(s) {
319
- return (s || '').replace(/<[^>]+>/g, '').trim();
320
- }
321
-
322
- function decodeEntities(s) {
323
- return (s || '')
324
- .replace(/&amp;/g, '&')
325
- .replace(/&lt;/g, '<')
326
- .replace(/&gt;/g, '>')
327
- .replace(/&quot;/g, '"')
328
- .replace(/&#x27;/g, "'")
329
- .replace(/&#39;/g, "'")
330
- .trim();
331
- }
332
-
333
- function normalizeUrl(url) {
334
- try {
335
- const u = new URL(url);
336
- return u.hostname.replace(/^www\./, '') + u.pathname.replace(/\/$/, '') + u.search;
337
- } catch {
338
- return url;
339
- }
340
- }
341
-
342
- function safeHostname(url) {
343
- try {
344
- return new URL(url).hostname.replace(/^www\./, '');
345
- } catch {
346
- return '';
347
- }
348
- }
349
-
350
- module.exports = {
351
- initSearchEngine,
352
- search,
353
- getSuggestions,
354
- getTrendingSearches,
355
- getSearchStats,
356
- purgeOldCache,
357
- };
1
+ /**
2
+ * WAB Search Engine — Independent search aggregator with caching,
3
+ * ranking, suggestions, and trending queries.
4
+ *
5
+ * All results are served under the WAB brand — no external engine
6
+ * branding is ever exposed to the user.
7
+ */
8
+
9
+ const crypto = require('crypto');
10
+
11
+ let db;
12
+
13
+ function initSearchEngine(database) {
14
+ db = database;
15
+
16
+ db.exec(`
17
+ CREATE TABLE IF NOT EXISTS search_cache (
18
+ query_hash TEXT PRIMARY KEY,
19
+ query TEXT NOT NULL,
20
+ results TEXT NOT NULL,
21
+ source TEXT DEFAULT 'multi',
22
+ created_at TEXT DEFAULT (datetime('now')),
23
+ hit_count INTEGER DEFAULT 1
24
+ );
25
+
26
+ CREATE TABLE IF NOT EXISTS search_history (
27
+ id INTEGER PRIMARY KEY AUTOINCREMENT,
28
+ query TEXT NOT NULL,
29
+ ip_hash TEXT,
30
+ results_count INTEGER DEFAULT 0,
31
+ created_at TEXT DEFAULT (datetime('now'))
32
+ );
33
+
34
+ CREATE TABLE IF NOT EXISTS search_suggestions (
35
+ query TEXT PRIMARY KEY,
36
+ frequency INTEGER DEFAULT 1,
37
+ last_searched TEXT DEFAULT (datetime('now'))
38
+ );
39
+
40
+ CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
+ CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
+ CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
+ `);
44
+ }
45
+
46
+ // ─── Cache Layer ──────────────────────────────────────────────────────
47
+
48
+ function queryHash(q) {
49
+ return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
+ }
51
+
52
+ function getCachedResults(query) {
53
+ const hash = queryHash(query);
54
+ const row = db.prepare(
55
+ `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
+ ).get(hash);
57
+ if (row) {
58
+ db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
+ return JSON.parse(row.results);
60
+ }
61
+ return null;
62
+ }
63
+
64
+ function setCachedResults(query, results, source) {
65
+ const hash = queryHash(query);
66
+ db.prepare(
67
+ `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
+ VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
+ ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
+ }
71
+
72
+ // Purge old cache entries (>24h)
73
+ function purgeOldCache() {
74
+ db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
+ }
76
+
77
+ // ─── Search History & Suggestions ─────────────────────────────────────
78
+
79
+ function recordSearch(query, ipHash, resultsCount) {
80
+ db.prepare(
81
+ `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
+ ).run(query.trim(), ipHash || null, resultsCount);
83
+
84
+ // Update suggestion frequency
85
+ const normalized = query.toLowerCase().trim();
86
+ if (normalized.length >= 2 && normalized.length <= 100) {
87
+ const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
+ if (existing) {
89
+ db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
+ } else {
91
+ db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
+ }
93
+ }
94
+ }
95
+
96
+ function getSuggestions(prefix, limit = 8) {
97
+ if (!prefix || prefix.length < 1) return [];
98
+ const normalized = prefix.toLowerCase().trim();
99
+ return db.prepare(
100
+ `SELECT query, frequency FROM search_suggestions
101
+ WHERE query LIKE ? AND frequency > 0
102
+ ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
+ ).all(normalized + '%', limit).map(r => r.query);
104
+ }
105
+
106
+ function getTrendingSearches(limit = 10) {
107
+ return db.prepare(
108
+ `SELECT query, COUNT(*) as count FROM search_history
109
+ WHERE created_at > datetime('now', '-24 hours')
110
+ GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
+ ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
+ }
113
+
114
+ function getSearchStats() {
115
+ const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
+ const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
+ const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
+ const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
+ return { total, today, cached, uniqueQueries };
120
+ }
121
+
122
+ // ─── Multi-Source Search ──────────────────────────────────────────────
123
+
124
+ const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
+ const HEADERS = {
126
+ 'User-Agent': UA,
127
+ 'Accept': 'text/html',
128
+ 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
+ };
130
+
131
+ async function searchDDG(q) {
132
+ try {
133
+ const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
134
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
135
+ const html = await resp.text();
136
+ const results = [];
137
+ const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
138
+ const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
139
+ const urls = [], titles = [], snippets = [];
140
+ let m;
141
+ while ((m = resultPattern.exec(html)) !== null) {
142
+ urls.push(m[1]);
143
+ titles.push(stripHtml(m[2]));
144
+ }
145
+ while ((m = snippetPattern.exec(html)) !== null) {
146
+ snippets.push(decodeEntities(stripHtml(m[1])));
147
+ }
148
+ for (let i = 0; i < Math.min(urls.length, 15); i++) {
149
+ let u = urls[i];
150
+ const uddg = u.match(/uddg=([^&]+)/);
151
+ if (uddg) u = decodeURIComponent(uddg[1]);
152
+ if (!u.startsWith('http')) continue;
153
+ results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
154
+ }
155
+ return results;
156
+ } catch (e) {
157
+ return [];
158
+ }
159
+ }
160
+
161
+ async function searchGoogle(q) {
162
+ try {
163
+ const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
164
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
165
+ const html = await resp.text();
166
+ const results = [];
167
+ const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
168
+ let m;
169
+ while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
170
+ const u = decodeURIComponent(m[1]);
171
+ if (!u.startsWith('http')) continue;
172
+ try { if (new URL(u).hostname.includes('google.')) continue; } catch { continue; }
173
+ const title = stripHtml(m[2]);
174
+ if (!title) continue;
175
+ results.push({ title, url: u, snippet: '', source: 'google' });
176
+ }
177
+ return results;
178
+ } catch (e) {
179
+ return [];
180
+ }
181
+ }
182
+
183
+ async function searchBing(q) {
184
+ try {
185
+ const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
186
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
187
+ const html = await resp.text();
188
+ const results = [];
189
+ // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
190
+ const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
191
+ let m;
192
+ while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
193
+ const u = m[1];
194
+ if (!u.startsWith('http')) continue;
195
+ try { if (new URL(u).hostname.includes('bing.')) continue; } catch { continue; }
196
+ const title = stripHtml(m[2]);
197
+ const snippet = decodeEntities(stripHtml(m[3]));
198
+ if (!title) continue;
199
+ results.push({ title, url: u, snippet, source: 'bing' });
200
+ }
201
+ return results;
202
+ } catch (e) {
203
+ return [];
204
+ }
205
+ }
206
+
207
+ // ─── Result Ranking Engine ────────────────────────────────────────────
208
+
209
/**
 * Merge, score and order raw results gathered from several search engines.
 *
 * Results are deduplicated by `normalizeUrl(url)`. The first occurrence wins
 * for `url`; a later duplicate can contribute a snippet (if none was present)
 * or a longer title. Each merged result is then scored:
 *   +30 per additional distinct engine that returned it,
 *   +15 for a snippet longer than 20 characters,
 *   +5  for an https:// URL,
 *   +8  when the host is not on the big-tech list,
 *   +5  for a .org/.edu/.gov/.dev host,
 *   -10 when the URL is longer than 200 characters.
 *
 * @param {Array<{title: string, url: string, snippet?: string, source?: string}>} allResults
 *   Concatenated per-engine results, in engine order.
 * @returns {Array<{title: string, url: string, snippet: string}>}
 *   Up to 15 results, highest score first; ties keep their input order.
 */
function rankResults(allResults) {
  const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
  const trustedTlds = ['org','edu','gov','dev'];

  // Deduplicate by URL (keep the one with the best snippet)
  const seen = new Map();
  for (const r of allResults) {
    // A single engine can list the same URL more than once, so the bonus is
    // based on distinct engines rather than on the raw number of duplicates.
    // Results without a `source` cannot be attributed, so each one is counted
    // as its own engine.
    const engine = r.source ?? Symbol('unlabelled');
    const key = normalizeUrl(r.url);
    const existing = seen.get(key);
    if (!existing) {
      seen.set(key, { ...r, engines: new Set([engine]) });
      continue;
    }
    existing.engines.add(engine);
    // Prefer the version with a snippet
    if (!existing.snippet && r.snippet) {
      existing.snippet = r.snippet;
    }
    // Prefer longer title
    if (r.title.length > existing.title.length) {
      existing.title = r.title;
    }
  }

  const deduplicated = Array.from(seen.values());

  // Score each result
  for (const r of deduplicated) {
    let score = 0;

    // Multi-source bonus: appearing in multiple engines means higher relevance
    score += (r.engines.size - 1) * 30;

    // Snippet presence
    if (r.snippet && r.snippet.length > 20) score += 15;

    // HTTPS bonus
    if (r.url.startsWith('https://')) score += 5;

    // Domain diversity: boost independent/small sites
    const hostname = safeHostname(r.url);
    const isBigTech = bigTech.some((d) => hostname === d || hostname.endsWith('.' + d));
    if (!isBigTech) score += 8;

    // Trusted TLDs
    const tld = hostname.split('.').pop();
    if (trustedTlds.includes(tld)) score += 5;

    // Penalize very long URLs (likely junk)
    if (r.url.length > 200) score -= 10;

    r.score = score;
  }

  // Sort by score descending; Array.prototype.sort is stable, so equal
  // scores keep their original order.
  deduplicated.sort((a, b) => b.score - a.score);

  // Return top 15, strip internal fields
  return deduplicated.slice(0, 15).map((r) => ({
    title: r.title,
    url: r.url,
    snippet: r.snippet || '',
  }));
}
271
+
272
+ // ─── Main Search Function ─────────────────────────────────────────────
273
+
274
/**
 * Run a search: serve from cache when possible, otherwise query all engines
 * in parallel, rank the merged results, cache them and record the search.
 *
 * @param {string} query - User-supplied query. Anything that is not a
 *   non-blank string (including arrays/objects produced by query-string
 *   parsers) yields the empty response instead of throwing.
 * @param {*} ipHash - Passed through unchanged to `recordSearch`.
 * @returns {Promise<{results: Array, cached: boolean}>} `cached` is true only
 *   when the results came from `getCachedResults`.
 */
async function search(query, ipHash) {
  // Guard the type before calling .trim(): a truthy non-string would throw.
  if (typeof query !== 'string') return { results: [], cached: false };

  const q = query.trim();
  if (!q) return { results: [], cached: false };

  // Check cache first
  const cached = getCachedResults(q);
  if (cached && cached.length > 0) {
    recordSearch(q, ipHash, cached.length);
    return { results: cached, cached: true };
  }

  // Fetch from all sources in parallel; allSettled keeps one failing engine
  // from discarding the others' results.
  const settled = await Promise.allSettled([
    searchDDG(q),
    searchGoogle(q),
    searchBing(q),
  ]);

  const allResults = settled.flatMap((outcome) =>
    outcome.status === 'fulfilled' ? outcome.value : [],
  );

  if (allResults.length === 0) {
    recordSearch(q, ipHash, 0);
    return { results: [], cached: false };
  }

  // Rank and deduplicate
  const ranked = rankResults(allResults);

  // Cache results
  setCachedResults(q, ranked, 'multi');

  // Record search
  recordSearch(q, ipHash, ranked.length);

  return { results: ranked, cached: false };
}
315
+
316
+ // ─── Helpers ──────────────────────────────────────────────────────────
317
+
318
/**
 * Remove anything that looks like an HTML tag and trim the remainder.
 *
 * @param {string} [s] - Markup fragment; a falsy value is treated as ''.
 * @returns {string} The text with `<...>` sequences removed and outer
 *   whitespace trimmed. Entities are left untouched.
 */
function stripHtml(s) {
  const markup = s || '';
  const textOnly = markup.replace(/<[^>]+>/g, '');
  return textOnly.trim();
}
321
+
322
/**
 * Decode common HTML character references and trim the result.
 *
 * Handles the named entities `&amp; &lt; &gt; &quot; &apos; &nbsp;` plus any
 * decimal (`&#39;`) or hexadecimal (`&#x27;`) numeric reference. Unknown
 * names and out-of-range code points are left as written.
 *
 * Decoding happens in a single pass, so text that was escaped twice
 * (`&amp;lt;`) is unescaped exactly once (`&lt;`) rather than collapsing to `<`.
 *
 * @param {string} [s] - Text to decode; a falsy value is treated as ''.
 * @returns {string} Decoded, trimmed text.
 */
function decodeEntities(s) {
  const named = new Map([
    ['amp', '&'],
    ['lt', '<'],
    ['gt', '>'],
    ['quot', '"'],
    ['apos', "'"],
    ['nbsp', '\u00A0'],
  ]);

  return (s || '')
    .replace(/&(#[xX][0-9a-fA-F]+|#[0-9]+|[a-zA-Z]+);/g, (match, body) => {
      if (body[0] !== '#') return named.get(body) ?? match;

      const isHex = body[1] === 'x' || body[1] === 'X';
      const codePoint = Number.parseInt(body.slice(isHex ? 2 : 1), isHex ? 16 : 10);
      // String.fromCodePoint throws a RangeError outside 0..0x10FFFF.
      const isValid = codePoint > 0 && codePoint <= 0x10ffff;
      return isValid ? String.fromCodePoint(codePoint) : match;
    })
    .trim();
}
332
+
333
/**
 * Build the key used to decide whether two result URLs are the same page.
 *
 * The key is the hostname without a leading `www.`, followed by the path
 * without one trailing slash, followed by the query string. Scheme, port and
 * fragment are not part of the key.
 *
 * @param {string} url - URL to normalise.
 * @returns {string} The key, or `url` unchanged when it cannot be parsed.
 */
function normalizeUrl(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return url;
  }

  const host = parsed.hostname.replace(/^www\./, '');
  const path = parsed.pathname.replace(/\/$/, '');
  return host + path + parsed.search;
}
341
+
342
/**
 * Extract a URL's hostname without throwing.
 *
 * @param {string} url - URL to inspect.
 * @returns {string} Hostname with a leading `www.` removed, or '' when the
 *   URL cannot be parsed.
 */
function safeHostname(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return '';
  }
  return parsed.hostname.replace(/^www\./, '');
}
349
+
350
+ module.exports = {
351
+ initSearchEngine,
352
+ search,
353
+ getSuggestions,
354
+ getTrendingSearches,
355
+ getSearchStats,
356
+ purgeOldCache,
357
+ };