web-agent-bridge 3.2.0 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (202) hide show
  1. package/LICENSE +72 -72
  2. package/README.ar.md +1286 -1152
  3. package/README.md +1764 -1635
  4. package/bin/agent-runner.js +474 -474
  5. package/bin/cli.js +237 -138
  6. package/bin/wab.js +80 -80
  7. package/examples/bidi-agent.js +119 -119
  8. package/examples/cross-site-agent.js +91 -91
  9. package/examples/mcp-agent.js +94 -94
  10. package/examples/next-app-router/README.md +44 -44
  11. package/examples/puppeteer-agent.js +108 -108
  12. package/examples/saas-dashboard/README.md +55 -55
  13. package/examples/shopify-hydrogen/README.md +74 -74
  14. package/examples/vision-agent.js +171 -171
  15. package/examples/wordpress-elementor/README.md +77 -77
  16. package/package.json +16 -3
  17. package/public/.well-known/agent-tools.json +180 -180
  18. package/public/.well-known/ai-assets.json +59 -59
  19. package/public/.well-known/security.txt +8 -0
  20. package/public/agent-workspace.html +349 -349
  21. package/public/ai.html +198 -198
  22. package/public/api.html +413 -412
  23. package/public/browser.html +486 -486
  24. package/public/commander-dashboard.html +243 -243
  25. package/public/cookies.html +210 -210
  26. package/public/css/agent-workspace.css +1713 -1713
  27. package/public/css/premium.css +317 -317
  28. package/public/css/styles.css +1235 -1235
  29. package/public/dashboard.html +706 -706
  30. package/public/dns.html +507 -0
  31. package/public/docs.html +587 -587
  32. package/public/feed.xml +89 -89
  33. package/public/growth.html +463 -463
  34. package/public/index.html +1070 -982
  35. package/public/integrations.html +556 -0
  36. package/public/js/agent-workspace.js +1740 -1740
  37. package/public/js/auth-nav.js +31 -31
  38. package/public/js/auth-redirect.js +12 -12
  39. package/public/js/cookie-consent.js +56 -56
  40. package/public/js/wab-demo-page.js +721 -721
  41. package/public/js/ws-client.js +74 -74
  42. package/public/llms-full.txt +360 -360
  43. package/public/llms.txt +125 -125
  44. package/public/login.html +85 -85
  45. package/public/mesh-dashboard.html +328 -328
  46. package/public/openapi.json +580 -580
  47. package/public/phone-shield.html +281 -0
  48. package/public/premium-dashboard.html +2489 -2489
  49. package/public/premium.html +793 -793
  50. package/public/privacy.html +297 -297
  51. package/public/register.html +105 -105
  52. package/public/robots.txt +87 -87
  53. package/public/script/wab-consent.d.ts +36 -36
  54. package/public/script/wab-consent.js +104 -104
  55. package/public/script/wab-schema.js +131 -131
  56. package/public/script/wab.d.ts +108 -108
  57. package/public/script/wab.min.js +580 -580
  58. package/public/security.txt +8 -0
  59. package/public/terms.html +256 -256
  60. package/script/ai-agent-bridge.js +1754 -1754
  61. package/sdk/README.md +99 -99
  62. package/sdk/agent-mesh.js +449 -449
  63. package/sdk/commander.js +262 -262
  64. package/sdk/index.d.ts +464 -464
  65. package/sdk/index.js +12 -1
  66. package/sdk/multi-agent.js +318 -318
  67. package/sdk/package.json +1 -1
  68. package/sdk/safety-shield.js +219 -0
  69. package/sdk/schema-discovery.js +83 -83
  70. package/server/adapters/index.js +520 -520
  71. package/server/config/plans.js +367 -367
  72. package/server/config/secrets.js +102 -102
  73. package/server/control-plane/index.js +301 -301
  74. package/server/data-plane/index.js +354 -354
  75. package/server/index.js +531 -427
  76. package/server/llm/index.js +404 -404
  77. package/server/middleware/adminAuth.js +35 -35
  78. package/server/middleware/auth.js +50 -50
  79. package/server/middleware/featureGate.js +88 -88
  80. package/server/middleware/rateLimits.js +100 -100
  81. package/server/middleware/sensitiveAction.js +157 -0
  82. package/server/migrations/001_add_analytics_indexes.sql +7 -7
  83. package/server/migrations/002_premium_features.sql +418 -418
  84. package/server/migrations/003_ads_integer_cents.sql +33 -33
  85. package/server/migrations/004_agent_os.sql +158 -158
  86. package/server/migrations/005_marketplace_metering.sql +126 -126
  87. package/server/models/adapters/index.js +33 -33
  88. package/server/models/adapters/mysql.js +183 -183
  89. package/server/models/adapters/postgresql.js +172 -172
  90. package/server/models/adapters/sqlite.js +7 -7
  91. package/server/models/db.js +681 -681
  92. package/server/observability/failure-analysis.js +337 -337
  93. package/server/observability/index.js +394 -394
  94. package/server/protocol/capabilities.js +223 -223
  95. package/server/protocol/index.js +243 -243
  96. package/server/protocol/schema.js +584 -584
  97. package/server/registry/certification.js +271 -271
  98. package/server/registry/index.js +326 -326
  99. package/server/routes/admin-premium.js +671 -671
  100. package/server/routes/admin.js +261 -261
  101. package/server/routes/ads.js +130 -130
  102. package/server/routes/agent-workspace.js +540 -540
  103. package/server/routes/api.js +150 -150
  104. package/server/routes/auth.js +71 -71
  105. package/server/routes/billing.js +45 -45
  106. package/server/routes/commander.js +316 -316
  107. package/server/routes/demo-showcase.js +332 -332
  108. package/server/routes/demo-store.js +154 -0
  109. package/server/routes/discovery.js +417 -417
  110. package/server/routes/gateway.js +173 -157
  111. package/server/routes/license.js +251 -240
  112. package/server/routes/mesh.js +469 -469
  113. package/server/routes/noscript.js +543 -543
  114. package/server/routes/premium-v2.js +686 -686
  115. package/server/routes/premium.js +724 -724
  116. package/server/routes/runtime.js +2148 -2147
  117. package/server/routes/sovereign.js +465 -385
  118. package/server/routes/universal.js +200 -185
  119. package/server/routes/wab-api.js +850 -501
  120. package/server/runtime/container-worker.js +111 -111
  121. package/server/runtime/container.js +448 -448
  122. package/server/runtime/distributed-worker.js +362 -362
  123. package/server/runtime/event-bus.js +210 -210
  124. package/server/runtime/index.js +253 -253
  125. package/server/runtime/queue.js +599 -599
  126. package/server/runtime/replay.js +666 -666
  127. package/server/runtime/sandbox.js +266 -266
  128. package/server/runtime/scheduler.js +534 -534
  129. package/server/runtime/session-engine.js +293 -293
  130. package/server/runtime/state-manager.js +188 -188
  131. package/server/security/cross-site-redactor.js +196 -0
  132. package/server/security/dry-run.js +180 -0
  133. package/server/security/human-gate-rate-limit.js +147 -0
  134. package/server/security/human-gate-transports.js +178 -0
  135. package/server/security/human-gate.js +281 -0
  136. package/server/security/index.js +368 -368
  137. package/server/security/intent-engine.js +245 -0
  138. package/server/security/reward-guard.js +171 -0
  139. package/server/security/rollback-store.js +239 -0
  140. package/server/security/token-scope.js +404 -0
  141. package/server/security/url-policy.js +139 -0
  142. package/server/services/agent-chat.js +506 -506
  143. package/server/services/agent-learning.js +601 -575
  144. package/server/services/agent-memory.js +625 -625
  145. package/server/services/agent-mesh.js +555 -539
  146. package/server/services/agent-symphony.js +717 -717
  147. package/server/services/agent-tasks.js +1807 -1807
  148. package/server/services/api-key-engine.js +292 -261
  149. package/server/services/cluster.js +894 -894
  150. package/server/services/commander.js +738 -738
  151. package/server/services/edge-compute.js +440 -440
  152. package/server/services/email.js +204 -204
  153. package/server/services/hosted-runtime.js +205 -205
  154. package/server/services/lfd.js +635 -635
  155. package/server/services/local-ai.js +389 -389
  156. package/server/services/marketplace.js +270 -270
  157. package/server/services/metering.js +182 -182
  158. package/server/services/modules/affiliate-intelligence.js +93 -93
  159. package/server/services/modules/agent-firewall.js +90 -90
  160. package/server/services/modules/bounty.js +89 -89
  161. package/server/services/modules/collective-bargaining.js +92 -92
  162. package/server/services/modules/dark-pattern.js +66 -66
  163. package/server/services/modules/gov-intelligence.js +45 -45
  164. package/server/services/modules/neural.js +55 -55
  165. package/server/services/modules/notary.js +49 -49
  166. package/server/services/modules/price-time-machine.js +86 -86
  167. package/server/services/modules/protocol.js +104 -104
  168. package/server/services/negotiation.js +439 -439
  169. package/server/services/plugins.js +771 -771
  170. package/server/services/price-intelligence.js +566 -566
  171. package/server/services/price-shield.js +1137 -1137
  172. package/server/services/reputation.js +465 -465
  173. package/server/services/search-engine.js +357 -357
  174. package/server/services/security.js +513 -513
  175. package/server/services/self-healing.js +843 -843
  176. package/server/services/sovereign-shield.js +542 -0
  177. package/server/services/stripe.js +192 -192
  178. package/server/services/swarm.js +788 -788
  179. package/server/services/universal-scraper.js +662 -661
  180. package/server/services/verification.js +481 -481
  181. package/server/services/vision.js +1163 -1163
  182. package/server/utils/cache.js +125 -125
  183. package/server/utils/migrate.js +81 -81
  184. package/server/utils/safe-fetch.js +228 -0
  185. package/server/utils/secureFields.js +50 -50
  186. package/server/ws.js +161 -161
  187. package/templates/artisan-marketplace.yaml +104 -104
  188. package/templates/book-price-scout.yaml +98 -98
  189. package/templates/electronics-price-tracker.yaml +108 -108
  190. package/templates/flight-deal-hunter.yaml +113 -113
  191. package/templates/freelancer-direct.yaml +116 -116
  192. package/templates/grocery-price-compare.yaml +93 -93
  193. package/templates/hotel-direct-booking.yaml +113 -113
  194. package/templates/local-services.yaml +98 -98
  195. package/templates/olive-oil-tunisia.yaml +88 -88
  196. package/templates/organic-farm-fresh.yaml +101 -101
  197. package/templates/restaurant-direct.yaml +97 -97
  198. package/public/score.html +0 -263
  199. package/server/migrations/006_growth_suite.sql +0 -138
  200. package/server/routes/growth.js +0 -962
  201. package/server/services/fairness-engine.js +0 -409
  202. package/server/services/fairness.js +0 -420
@@ -1,357 +1,357 @@
1
- /**
2
- * WAB Search Engine — Independent search aggregator with caching,
3
- * ranking, suggestions, and trending queries.
4
- *
5
- * All results are served under the WAB brand — no external engine
6
- * branding is ever exposed to the user.
7
- */
8
-
9
- const crypto = require('crypto');
10
-
11
- let db;
12
-
13
- function initSearchEngine(database) {
14
- db = database;
15
-
16
- db.exec(`
17
- CREATE TABLE IF NOT EXISTS search_cache (
18
- query_hash TEXT PRIMARY KEY,
19
- query TEXT NOT NULL,
20
- results TEXT NOT NULL,
21
- source TEXT DEFAULT 'multi',
22
- created_at TEXT DEFAULT (datetime('now')),
23
- hit_count INTEGER DEFAULT 1
24
- );
25
-
26
- CREATE TABLE IF NOT EXISTS search_history (
27
- id INTEGER PRIMARY KEY AUTOINCREMENT,
28
- query TEXT NOT NULL,
29
- ip_hash TEXT,
30
- results_count INTEGER DEFAULT 0,
31
- created_at TEXT DEFAULT (datetime('now'))
32
- );
33
-
34
- CREATE TABLE IF NOT EXISTS search_suggestions (
35
- query TEXT PRIMARY KEY,
36
- frequency INTEGER DEFAULT 1,
37
- last_searched TEXT DEFAULT (datetime('now'))
38
- );
39
-
40
- CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
- CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
- CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
- `);
44
- }
45
-
46
- // ─── Cache Layer ──────────────────────────────────────────────────────
47
-
48
- function queryHash(q) {
49
- return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
- }
51
-
52
- function getCachedResults(query) {
53
- const hash = queryHash(query);
54
- const row = db.prepare(
55
- `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
- ).get(hash);
57
- if (row) {
58
- db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
- return JSON.parse(row.results);
60
- }
61
- return null;
62
- }
63
-
64
- function setCachedResults(query, results, source) {
65
- const hash = queryHash(query);
66
- db.prepare(
67
- `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
- VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
- ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
- }
71
-
72
- // Purge old cache entries (>24h)
73
- function purgeOldCache() {
74
- db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
- }
76
-
77
- // ─── Search History & Suggestions ─────────────────────────────────────
78
-
79
- function recordSearch(query, ipHash, resultsCount) {
80
- db.prepare(
81
- `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
- ).run(query.trim(), ipHash || null, resultsCount);
83
-
84
- // Update suggestion frequency
85
- const normalized = query.toLowerCase().trim();
86
- if (normalized.length >= 2 && normalized.length <= 100) {
87
- const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
- if (existing) {
89
- db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
- } else {
91
- db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
- }
93
- }
94
- }
95
-
96
- function getSuggestions(prefix, limit = 8) {
97
- if (!prefix || prefix.length < 1) return [];
98
- const normalized = prefix.toLowerCase().trim();
99
- return db.prepare(
100
- `SELECT query, frequency FROM search_suggestions
101
- WHERE query LIKE ? AND frequency > 0
102
- ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
- ).all(normalized + '%', limit).map(r => r.query);
104
- }
105
-
106
- function getTrendingSearches(limit = 10) {
107
- return db.prepare(
108
- `SELECT query, COUNT(*) as count FROM search_history
109
- WHERE created_at > datetime('now', '-24 hours')
110
- GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
- ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
- }
113
-
114
- function getSearchStats() {
115
- const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
- const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
- const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
- const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
- return { total, today, cached, uniqueQueries };
120
- }
121
-
122
- // ─── Multi-Source Search ──────────────────────────────────────────────
123
-
124
- const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
- const HEADERS = {
126
- 'User-Agent': UA,
127
- 'Accept': 'text/html',
128
- 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
- };
130
-
131
- async function searchDDG(q) {
132
- try {
133
- const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
134
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
135
- const html = await resp.text();
136
- const results = [];
137
- const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
138
- const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
139
- const urls = [], titles = [], snippets = [];
140
- let m;
141
- while ((m = resultPattern.exec(html)) !== null) {
142
- urls.push(m[1]);
143
- titles.push(stripHtml(m[2]));
144
- }
145
- while ((m = snippetPattern.exec(html)) !== null) {
146
- snippets.push(decodeEntities(stripHtml(m[1])));
147
- }
148
- for (let i = 0; i < Math.min(urls.length, 15); i++) {
149
- let u = urls[i];
150
- const uddg = u.match(/uddg=([^&]+)/);
151
- if (uddg) u = decodeURIComponent(uddg[1]);
152
- if (!u.startsWith('http')) continue;
153
- results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
154
- }
155
- return results;
156
- } catch (e) {
157
- return [];
158
- }
159
- }
160
-
161
- async function searchGoogle(q) {
162
- try {
163
- const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
164
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
165
- const html = await resp.text();
166
- const results = [];
167
- const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
168
- let m;
169
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
170
- const u = decodeURIComponent(m[1]);
171
- if (!u.startsWith('http')) continue;
172
- try { if (new URL(u).hostname.includes('google.')) continue; } catch { continue; }
173
- const title = stripHtml(m[2]);
174
- if (!title) continue;
175
- results.push({ title, url: u, snippet: '', source: 'google' });
176
- }
177
- return results;
178
- } catch (e) {
179
- return [];
180
- }
181
- }
182
-
183
- async function searchBing(q) {
184
- try {
185
- const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
186
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
187
- const html = await resp.text();
188
- const results = [];
189
- // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
190
- const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
191
- let m;
192
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
193
- const u = m[1];
194
- if (!u.startsWith('http')) continue;
195
- try { if (new URL(u).hostname.includes('bing.')) continue; } catch { continue; }
196
- const title = stripHtml(m[2]);
197
- const snippet = decodeEntities(stripHtml(m[3]));
198
- if (!title) continue;
199
- results.push({ title, url: u, snippet, source: 'bing' });
200
- }
201
- return results;
202
- } catch (e) {
203
- return [];
204
- }
205
- }
206
-
207
- // ─── Result Ranking Engine ────────────────────────────────────────────
208
-
209
- function rankResults(allResults) {
210
- // Deduplicate by URL (keep the one with the best snippet)
211
- const seen = new Map();
212
- for (const r of allResults) {
213
- const normalizedUrl = normalizeUrl(r.url);
214
- const existing = seen.get(normalizedUrl);
215
- if (!existing) {
216
- seen.set(normalizedUrl, { ...r, sourceCount: 1 });
217
- } else {
218
- existing.sourceCount++;
219
- // Prefer the version with a snippet
220
- if (!existing.snippet && r.snippet) {
221
- existing.snippet = r.snippet;
222
- }
223
- // Prefer longer title
224
- if (r.title.length > existing.title.length) {
225
- existing.title = r.title;
226
- }
227
- }
228
- }
229
-
230
- const deduplicated = Array.from(seen.values());
231
-
232
- // Score each result
233
- for (const r of deduplicated) {
234
- let score = 0;
235
-
236
- // Multi-source bonus: appearing in multiple engines means higher relevance
237
- score += (r.sourceCount - 1) * 30;
238
-
239
- // Snippet presence
240
- if (r.snippet && r.snippet.length > 20) score += 15;
241
-
242
- // HTTPS bonus
243
- if (r.url.startsWith('https://')) score += 5;
244
-
245
- // Domain diversity: boost independent/small sites
246
- const hostname = safeHostname(r.url);
247
- const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
248
- const isBigTech = bigTech.some(d => hostname === d || hostname.endsWith('.' + d));
249
- if (!isBigTech) score += 8;
250
-
251
- // Trusted TLDs
252
- const tld = hostname.split('.').pop();
253
- if (['org','edu','gov','dev'].includes(tld)) score += 5;
254
-
255
- // Penalize very long URLs (likely junk)
256
- if (r.url.length > 200) score -= 10;
257
-
258
- r.score = score;
259
- }
260
-
261
- // Sort by score descending, then by original order
262
- deduplicated.sort((a, b) => b.score - a.score);
263
-
264
- // Return top 15, strip internal fields
265
- return deduplicated.slice(0, 15).map(r => ({
266
- title: r.title,
267
- url: r.url,
268
- snippet: r.snippet || '',
269
- }));
270
- }
271
-
272
- // ─── Main Search Function ─────────────────────────────────────────────
273
-
274
- async function search(query, ipHash) {
275
- if (!query || !query.trim()) return { results: [], cached: false };
276
-
277
- const q = query.trim();
278
-
279
- // Check cache first
280
- const cached = getCachedResults(q);
281
- if (cached && cached.length > 0) {
282
- recordSearch(q, ipHash, cached.length);
283
- return { results: cached, cached: true };
284
- }
285
-
286
- // Fetch from all sources in parallel
287
- const [ddgResults, googleResults, bingResults] = await Promise.allSettled([
288
- searchDDG(q),
289
- searchGoogle(q),
290
- searchBing(q),
291
- ]);
292
-
293
- const allResults = [
294
- ...(ddgResults.status === 'fulfilled' ? ddgResults.value : []),
295
- ...(googleResults.status === 'fulfilled' ? googleResults.value : []),
296
- ...(bingResults.status === 'fulfilled' ? bingResults.value : []),
297
- ];
298
-
299
- if (allResults.length === 0) {
300
- recordSearch(q, ipHash, 0);
301
- return { results: [], cached: false };
302
- }
303
-
304
- // Rank and deduplicate
305
- const ranked = rankResults(allResults);
306
-
307
- // Cache results
308
- setCachedResults(q, ranked, 'multi');
309
-
310
- // Record search
311
- recordSearch(q, ipHash, ranked.length);
312
-
313
- return { results: ranked, cached: false };
314
- }
315
-
316
- // ─── Helpers ──────────────────────────────────────────────────────────
317
-
318
- function stripHtml(s) {
319
- return (s || '').replace(/<[^>]+>/g, '').trim();
320
- }
321
-
322
- function decodeEntities(s) {
323
- return (s || '')
324
- .replace(/&amp;/g, '&')
325
- .replace(/&lt;/g, '<')
326
- .replace(/&gt;/g, '>')
327
- .replace(/&quot;/g, '"')
328
- .replace(/&#x27;/g, "'")
329
- .replace(/&#39;/g, "'")
330
- .trim();
331
- }
332
-
333
- function normalizeUrl(url) {
334
- try {
335
- const u = new URL(url);
336
- return u.hostname.replace(/^www\./, '') + u.pathname.replace(/\/$/, '') + u.search;
337
- } catch {
338
- return url;
339
- }
340
- }
341
-
342
- function safeHostname(url) {
343
- try {
344
- return new URL(url).hostname.replace(/^www\./, '');
345
- } catch {
346
- return '';
347
- }
348
- }
349
-
350
- module.exports = {
351
- initSearchEngine,
352
- search,
353
- getSuggestions,
354
- getTrendingSearches,
355
- getSearchStats,
356
- purgeOldCache,
357
- };
1
+ /**
2
+ * WAB Search Engine — Independent search aggregator with caching,
3
+ * ranking, suggestions, and trending queries.
4
+ *
5
+ * All results are served under the WAB brand — no external engine
6
+ * branding is ever exposed to the user.
7
+ */
8
+
9
+ const crypto = require('crypto');
10
+
11
+ let db;
12
+
13
+ function initSearchEngine(database) {
14
+ db = database;
15
+
16
+ db.exec(`
17
+ CREATE TABLE IF NOT EXISTS search_cache (
18
+ query_hash TEXT PRIMARY KEY,
19
+ query TEXT NOT NULL,
20
+ results TEXT NOT NULL,
21
+ source TEXT DEFAULT 'multi',
22
+ created_at TEXT DEFAULT (datetime('now')),
23
+ hit_count INTEGER DEFAULT 1
24
+ );
25
+
26
+ CREATE TABLE IF NOT EXISTS search_history (
27
+ id INTEGER PRIMARY KEY AUTOINCREMENT,
28
+ query TEXT NOT NULL,
29
+ ip_hash TEXT,
30
+ results_count INTEGER DEFAULT 0,
31
+ created_at TEXT DEFAULT (datetime('now'))
32
+ );
33
+
34
+ CREATE TABLE IF NOT EXISTS search_suggestions (
35
+ query TEXT PRIMARY KEY,
36
+ frequency INTEGER DEFAULT 1,
37
+ last_searched TEXT DEFAULT (datetime('now'))
38
+ );
39
+
40
+ CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
+ CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
+ CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
+ `);
44
+ }
45
+
46
+ // ─── Cache Layer ──────────────────────────────────────────────────────
47
+
48
+ function queryHash(q) {
49
+ return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
+ }
51
+
52
+ function getCachedResults(query) {
53
+ const hash = queryHash(query);
54
+ const row = db.prepare(
55
+ `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
+ ).get(hash);
57
+ if (row) {
58
+ db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
+ return JSON.parse(row.results);
60
+ }
61
+ return null;
62
+ }
63
+
64
+ function setCachedResults(query, results, source) {
65
+ const hash = queryHash(query);
66
+ db.prepare(
67
+ `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
+ VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
+ ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
+ }
71
+
72
+ // Purge old cache entries (>24h)
73
+ function purgeOldCache() {
74
+ db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
+ }
76
+
77
+ // ─── Search History & Suggestions ─────────────────────────────────────
78
+
79
+ function recordSearch(query, ipHash, resultsCount) {
80
+ db.prepare(
81
+ `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
+ ).run(query.trim(), ipHash || null, resultsCount);
83
+
84
+ // Update suggestion frequency
85
+ const normalized = query.toLowerCase().trim();
86
+ if (normalized.length >= 2 && normalized.length <= 100) {
87
+ const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
+ if (existing) {
89
+ db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
+ } else {
91
+ db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
+ }
93
+ }
94
+ }
95
+
96
+ function getSuggestions(prefix, limit = 8) {
97
+ if (!prefix || prefix.length < 1) return [];
98
+ const normalized = prefix.toLowerCase().trim();
99
+ return db.prepare(
100
+ `SELECT query, frequency FROM search_suggestions
101
+ WHERE query LIKE ? AND frequency > 0
102
+ ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
+ ).all(normalized + '%', limit).map(r => r.query);
104
+ }
105
+
106
+ function getTrendingSearches(limit = 10) {
107
+ return db.prepare(
108
+ `SELECT query, COUNT(*) as count FROM search_history
109
+ WHERE created_at > datetime('now', '-24 hours')
110
+ GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
+ ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
+ }
113
+
114
+ function getSearchStats() {
115
+ const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
+ const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
+ const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
+ const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
+ return { total, today, cached, uniqueQueries };
120
+ }
121
+
122
+ // ─── Multi-Source Search ──────────────────────────────────────────────
123
+
124
+ const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
+ const HEADERS = {
126
+ 'User-Agent': UA,
127
+ 'Accept': 'text/html',
128
+ 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
+ };
130
+
131
+ async function searchDDG(q) {
132
+ try {
133
+ const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
134
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
135
+ const html = await resp.text();
136
+ const results = [];
137
+ const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
138
+ const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
139
+ const urls = [], titles = [], snippets = [];
140
+ let m;
141
+ while ((m = resultPattern.exec(html)) !== null) {
142
+ urls.push(m[1]);
143
+ titles.push(stripHtml(m[2]));
144
+ }
145
+ while ((m = snippetPattern.exec(html)) !== null) {
146
+ snippets.push(decodeEntities(stripHtml(m[1])));
147
+ }
148
+ for (let i = 0; i < Math.min(urls.length, 15); i++) {
149
+ let u = urls[i];
150
+ const uddg = u.match(/uddg=([^&]+)/);
151
+ if (uddg) u = decodeURIComponent(uddg[1]);
152
+ if (!u.startsWith('http')) continue;
153
+ results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
154
+ }
155
+ return results;
156
+ } catch (e) {
157
+ return [];
158
+ }
159
+ }
160
+
161
+ async function searchGoogle(q) {
162
+ try {
163
+ const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
164
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
165
+ const html = await resp.text();
166
+ const results = [];
167
+ const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
168
+ let m;
169
+ while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
170
+ const u = decodeURIComponent(m[1]);
171
+ if (!u.startsWith('http')) continue;
172
+ try { if (new URL(u).hostname.includes('google.')) continue; } catch { continue; }
173
+ const title = stripHtml(m[2]);
174
+ if (!title) continue;
175
+ results.push({ title, url: u, snippet: '', source: 'google' });
176
+ }
177
+ return results;
178
+ } catch (e) {
179
+ return [];
180
+ }
181
+ }
182
+
183
+ async function searchBing(q) {
184
+ try {
185
+ const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
186
+ const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
187
+ const html = await resp.text();
188
+ const results = [];
189
+ // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
190
+ const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
191
+ let m;
192
+ while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
193
+ const u = m[1];
194
+ if (!u.startsWith('http')) continue;
195
+ try { if (new URL(u).hostname.includes('bing.')) continue; } catch { continue; }
196
+ const title = stripHtml(m[2]);
197
+ const snippet = decodeEntities(stripHtml(m[3]));
198
+ if (!title) continue;
199
+ results.push({ title, url: u, snippet, source: 'bing' });
200
+ }
201
+ return results;
202
+ } catch (e) {
203
+ return [];
204
+ }
205
+ }
206
+
207
+ // ─── Result Ranking Engine ────────────────────────────────────────────
208
+
209
/**
 * Merge results from several engines, score them, and return the best 15.
 *
 * Results whose normalized URL matches are merged into one entry that keeps
 * the first URL seen, the first non-empty snippet, and the longest title.
 * The multi-source bonus is based on the number of DISTINCT `source` values
 * that returned the URL, so an engine listing the same link twice on one page
 * does not earn the bonus on its own.
 *
 * @param {Array<{title: string, url: string, snippet?: string, source?: string}>} allResults
 *   Raw results from every engine, in the order they should win ties.
 * @returns {Array<{title: string, url: string, snippet: string}>}
 *   Up to 15 results, highest score first; internal fields are stripped.
 */
function rankResults(allResults) {
  // Constant lookup lists, built once instead of once per scored result.
  const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
  const trustedTlds = ['org','edu','gov','dev'];

  // Deduplicate by normalized URL, remembering which engines returned it.
  const seen = new Map();
  for (const r of allResults) {
    const normalizedUrl = normalizeUrl(r.url);
    const existing = seen.get(normalizedUrl);
    if (!existing) {
      seen.set(normalizedUrl, { ...r, sources: new Set([r.source]) });
      continue;
    }
    existing.sources.add(r.source);
    // Prefer the version with a snippet
    if (!existing.snippet && r.snippet) {
      existing.snippet = r.snippet;
    }
    // Prefer longer title
    if (r.title.length > existing.title.length) {
      existing.title = r.title;
    }
  }

  const deduplicated = Array.from(seen.values());

  // Score each result
  for (const r of deduplicated) {
    let score = 0;

    // Multi-source bonus: appearing in multiple engines means higher relevance
    score += (r.sources.size - 1) * 30;

    // Snippet presence
    if (r.snippet && r.snippet.length > 20) score += 15;

    // HTTPS bonus
    if (r.url.startsWith('https://')) score += 5;

    // Domain diversity: boost independent/small sites
    const hostname = safeHostname(r.url);
    const isBigTech = bigTech.some((d) => hostname === d || hostname.endsWith('.' + d));
    if (!isBigTech) score += 8;

    // Trusted TLDs
    const tld = hostname.split('.').pop();
    if (trustedTlds.includes(tld)) score += 5;

    // Penalize very long URLs (likely junk)
    if (r.url.length > 200) score -= 10;

    r.score = score;
  }

  // Sort by score descending; Array.prototype.sort is stable, so equal scores
  // keep their original (first-seen) order.
  deduplicated.sort((a, b) => b.score - a.score);

  // Return top 15, strip internal fields
  return deduplicated.slice(0, 15).map((r) => ({
    title: r.title,
    url: r.url,
    snippet: r.snippet || '',
  }));
}
271
+
272
+ // ─── Main Search Function ─────────────────────────────────────────────
273
+
274
/**
 * Run a meta-search: serve from cache when possible, otherwise query every
 * engine in parallel, merge and rank the hits, cache them, and log the search.
 *
 * @param {string} query - Raw user query. Anything that is not a non-blank
 *   string (including arrays/objects produced by query-string parsers) is
 *   treated as an empty query instead of throwing.
 * @param {string} ipHash - Opaque requester identifier, passed through to
 *   `recordSearch` unchanged.
 * @returns {Promise<{results: Array<object>, cached: boolean}>}
 *   `cached` is true only when the results came from the cache.
 */
async function search(query, ipHash) {
  const emptyResponse = { results: [], cached: false };

  // Guard the type first: calling .trim() on an array or number would throw.
  if (typeof query !== 'string') return emptyResponse;

  const q = query.trim();
  if (!q) return emptyResponse;

  // Check cache first
  const cached = getCachedResults(q);
  if (cached && cached.length > 0) {
    recordSearch(q, ipHash, cached.length);
    return { results: cached, cached: true };
  }

  // Fetch from all sources in parallel; allSettled keeps one failing engine
  // from discarding the results of the others.
  const settled = await Promise.allSettled([
    searchDDG(q),
    searchGoogle(q),
    searchBing(q),
  ]);
  const allResults = settled.flatMap((outcome) => (
    outcome.status === 'fulfilled' ? outcome.value : []
  ));

  if (allResults.length === 0) {
    recordSearch(q, ipHash, 0);
    return { results: [], cached: false };
  }

  // Rank and deduplicate
  const ranked = rankResults(allResults);

  // Cache results
  setCachedResults(q, ranked, 'multi');

  // Record search
  recordSearch(q, ipHash, ranked.length);

  return { results: ranked, cached: false };
}
315
+
316
+ // ─── Helpers ──────────────────────────────────────────────────────────
317
+
318
/**
 * Drop every `<...>` tag from a fragment and trim the surrounding whitespace.
 * Character entities (e.g. `&amp;`) are left exactly as they appear.
 *
 * @param {string} [s] - HTML fragment; any falsy value is treated as ''.
 * @returns {string} The fragment's text with tags removed.
 */
function stripHtml(s) {
  const markup = s || '';
  const withoutTags = markup.replace(/<[^>]+>/g, '');
  return withoutTags.trim();
}
321
+
322
/**
 * Decode the HTML character references that commonly appear in scraped text
 * and trim the result.
 *
 * Decoding happens in ONE pass over the input. Decoding `&amp;` in an earlier
 * pass than the other entities would turn an escaped entity such as
 * `&amp;lt;` into `<` (double-unescaping) instead of the literal text `&lt;`.
 *
 * Handles `&amp; &lt; &gt; &quot; &apos;` plus decimal (`&#39;`) and
 * hexadecimal (`&#x27;`) numeric references. Unknown names and numeric
 * references that are not valid Unicode scalar values are left untouched.
 *
 * @param {string} [s] - Text to decode; any falsy value is treated as ''.
 * @returns {string} Decoded, trimmed text.
 */
function decodeEntities(s) {
  const named = { amp: '&', lt: '<', gt: '>', quot: '"', apos: "'" };

  return (s || '')
    .replace(/&(#x[0-9a-f]+|#\d+|amp|lt|gt|quot|apos);/gi, (match, body) => {
      if (body[0] !== '#') return named[body.toLowerCase()];

      const isHex = body[1] === 'x' || body[1] === 'X';
      const codePoint = Number.parseInt(body.slice(isHex ? 2 : 1), isHex ? 16 : 10);
      // String.fromCodePoint throws on out-of-range input, and NUL or lone
      // surrogates are not meaningful text, so keep such references verbatim.
      const isScalar = codePoint > 0
        && codePoint <= 0x10ffff
        && (codePoint < 0xd800 || codePoint > 0xdfff);
      return isScalar ? String.fromCodePoint(codePoint) : match;
    })
    .trim();
}
332
+
333
/**
 * Build the key used to recognise two links as the same page: host without a
 * leading "www.", path without one trailing slash, plus the query string.
 * Scheme, port, and fragment are not part of the key.
 *
 * @param {string} url - Absolute URL.
 * @returns {string} The comparison key, or `url` unchanged when it cannot be parsed.
 */
function normalizeUrl(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return url;
  }

  const host = parsed.hostname.replace(/^www\./, '');
  const path = parsed.pathname.replace(/\/$/, '');
  return `${host}${path}${parsed.search}`;
}
341
+
342
/**
 * Extract the hostname of a URL, minus a leading "www.", without ever throwing.
 *
 * @param {string} url - Absolute URL.
 * @returns {string} The hostname, or '' when `url` cannot be parsed.
 */
function safeHostname(url) {
  let host = '';
  try {
    const { hostname } = new URL(url);
    host = hostname.replace(/^www\./, '');
  } catch {
    // Unparsable input: fall through and report an empty hostname.
  }
  return host;
}
349
+
350
// Public API of this module. Only the six functions listed here are exported;
// the per-engine scrapers (e.g. searchBing), rankResults, and the string/URL
// helpers (stripHtml, decodeEntities, normalizeUrl, safeHostname) stay private.
+ module.exports = {
350
+ initSearchEngine,
351
+ search,
352
+ getSuggestions,
353
+ getTrendingSearches,
354
+ getSearchStats,
355
+ purgeOldCache,
356
+ };