web-agent-bridge 3.2.0 → 3.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (256) hide show
  1. package/LICENSE +84 -72
  2. package/README.ar.md +1304 -1152
  3. package/README.md +298 -1635
  4. package/bin/agent-runner.js +474 -474
  5. package/bin/cli.js +237 -138
  6. package/bin/wab-init.js +223 -0
  7. package/bin/wab.js +80 -80
  8. package/examples/azure-dns-wab.js +83 -0
  9. package/examples/bidi-agent.js +119 -119
  10. package/examples/cloudflare-wab-dns.js +121 -0
  11. package/examples/cpanel-wab-dns.js +114 -0
  12. package/examples/cross-site-agent.js +91 -91
  13. package/examples/dns-discovery-agent.js +166 -0
  14. package/examples/gcp-dns-wab.js +76 -0
  15. package/examples/governance-agent.js +169 -0
  16. package/examples/mcp-agent.js +94 -94
  17. package/examples/next-app-router/README.md +44 -44
  18. package/examples/plesk-wab-dns.js +103 -0
  19. package/examples/puppeteer-agent.js +108 -108
  20. package/examples/route53-wab-dns.js +144 -0
  21. package/examples/saas-dashboard/README.md +55 -55
  22. package/examples/safe-mode-agent.js +96 -0
  23. package/examples/shopify-hydrogen/README.md +74 -74
  24. package/examples/vision-agent.js +171 -171
  25. package/examples/wab-sign.js +74 -0
  26. package/examples/wab-verify.js +60 -0
  27. package/examples/wordpress-elementor/README.md +77 -77
  28. package/package.json +19 -6
  29. package/public/.well-known/agent-tools.json +180 -180
  30. package/public/.well-known/ai-assets.json +59 -59
  31. package/public/.well-known/security.txt +8 -0
  32. package/public/.well-known/wab.json +28 -0
  33. package/public/activate.html +368 -0
  34. package/public/adoption-metrics.html +188 -0
  35. package/public/agent-workspace.html +349 -349
  36. package/public/ai.html +198 -198
  37. package/public/api.html +413 -412
  38. package/public/azure-dns-integration.html +289 -0
  39. package/public/browser.html +486 -486
  40. package/public/cloudflare-integration.html +380 -0
  41. package/public/commander-dashboard.html +243 -243
  42. package/public/cookies.html +210 -210
  43. package/public/cpanel-integration.html +398 -0
  44. package/public/css/agent-workspace.css +1713 -1713
  45. package/public/css/premium.css +317 -317
  46. package/public/css/styles.css +1263 -1235
  47. package/public/dashboard.html +707 -706
  48. package/public/dns.html +436 -0
  49. package/public/docs.html +588 -587
  50. package/public/feed.xml +89 -89
  51. package/public/gcp-dns-integration.html +318 -0
  52. package/public/growth.html +465 -463
  53. package/public/index.html +1266 -982
  54. package/public/integrations.html +556 -0
  55. package/public/js/activate.js +145 -0
  56. package/public/js/agent-workspace.js +1740 -1740
  57. package/public/js/auth-nav.js +65 -31
  58. package/public/js/auth-redirect.js +12 -12
  59. package/public/js/cookie-consent.js +56 -56
  60. package/public/js/dns.js +438 -0
  61. package/public/js/wab-demo-page.js +721 -721
  62. package/public/js/ws-client.js +74 -74
  63. package/public/llms-full.txt +360 -360
  64. package/public/llms.txt +125 -125
  65. package/public/login.html +85 -85
  66. package/public/mesh-dashboard.html +328 -328
  67. package/public/openapi.json +669 -580
  68. package/public/phone-shield.html +281 -0
  69. package/public/plesk-integration.html +375 -0
  70. package/public/premium-dashboard.html +2489 -2489
  71. package/public/premium.html +793 -793
  72. package/public/privacy.html +297 -297
  73. package/public/provider-onboarding.html +172 -0
  74. package/public/provider-sandbox.html +134 -0
  75. package/public/providers.html +359 -0
  76. package/public/register.html +105 -105
  77. package/public/registrar-integrations.html +141 -0
  78. package/public/robots.txt +99 -87
  79. package/public/route53-integration.html +531 -0
  80. package/public/script/wab-consent.d.ts +36 -36
  81. package/public/script/wab-consent.js +104 -104
  82. package/public/script/wab-schema.js +131 -131
  83. package/public/script/wab.d.ts +108 -108
  84. package/public/script/wab.min.js +580 -580
  85. package/public/security.txt +8 -0
  86. package/public/shieldqr.html +231 -0
  87. package/public/sitemap.xml +6 -0
  88. package/public/terms.html +256 -256
  89. package/public/wab-trust.html +200 -0
  90. package/public/wab-vs-protocols.html +210 -0
  91. package/public/whitepaper.html +449 -0
  92. package/script/ai-agent-bridge.js +1754 -1754
  93. package/sdk/README.md +99 -99
  94. package/sdk/agent-mesh.js +449 -449
  95. package/sdk/auto-discovery.js +288 -0
  96. package/sdk/commander.js +262 -262
  97. package/sdk/governance.js +262 -0
  98. package/sdk/index.d.ts +464 -464
  99. package/sdk/index.js +25 -1
  100. package/sdk/multi-agent.js +318 -318
  101. package/sdk/package.json +2 -2
  102. package/sdk/safe-mode.js +221 -0
  103. package/sdk/safety-shield.js +219 -0
  104. package/sdk/schema-discovery.js +83 -83
  105. package/server/adapters/index.js +520 -520
  106. package/server/config/plans.js +367 -367
  107. package/server/config/secrets.js +102 -102
  108. package/server/control-plane/index.js +301 -301
  109. package/server/data-plane/index.js +354 -354
  110. package/server/index.js +670 -427
  111. package/server/llm/index.js +404 -404
  112. package/server/middleware/adminAuth.js +35 -35
  113. package/server/middleware/auth.js +50 -50
  114. package/server/middleware/featureGate.js +88 -88
  115. package/server/middleware/rateLimits.js +100 -100
  116. package/server/middleware/sensitiveAction.js +157 -0
  117. package/server/migrations/001_add_analytics_indexes.sql +7 -7
  118. package/server/migrations/002_premium_features.sql +418 -418
  119. package/server/migrations/003_ads_integer_cents.sql +33 -33
  120. package/server/migrations/004_agent_os.sql +158 -158
  121. package/server/migrations/005_marketplace_metering.sql +126 -126
  122. package/server/migrations/007_governance.sql +106 -0
  123. package/server/migrations/008_plans.sql +144 -0
  124. package/server/migrations/009_shieldqr.sql +30 -0
  125. package/server/migrations/010_extended_trust.sql +33 -0
  126. package/server/models/adapters/index.js +33 -33
  127. package/server/models/adapters/mysql.js +183 -183
  128. package/server/models/adapters/postgresql.js +172 -172
  129. package/server/models/adapters/sqlite.js +7 -7
  130. package/server/models/db.js +740 -681
  131. package/server/observability/failure-analysis.js +337 -337
  132. package/server/observability/index.js +394 -394
  133. package/server/protocol/capabilities.js +223 -223
  134. package/server/protocol/index.js +243 -243
  135. package/server/protocol/schema.js +584 -584
  136. package/server/registry/certification.js +271 -271
  137. package/server/registry/index.js +326 -326
  138. package/server/routes/admin-plans.js +76 -0
  139. package/server/routes/admin-premium.js +673 -671
  140. package/server/routes/admin-shieldqr.js +90 -0
  141. package/server/routes/admin-trust-monitor.js +83 -0
  142. package/server/routes/admin.js +549 -261
  143. package/server/routes/ads.js +130 -130
  144. package/server/routes/agent-workspace.js +540 -540
  145. package/server/routes/api.js +150 -150
  146. package/server/routes/auth.js +71 -71
  147. package/server/routes/billing.js +57 -45
  148. package/server/routes/commander.js +316 -316
  149. package/server/routes/demo-showcase.js +332 -332
  150. package/server/routes/demo-store.js +154 -0
  151. package/server/routes/discovery.js +2348 -417
  152. package/server/routes/gateway.js +173 -157
  153. package/server/routes/governance.js +208 -0
  154. package/server/routes/license.js +251 -240
  155. package/server/routes/mesh.js +469 -469
  156. package/server/routes/noscript.js +543 -543
  157. package/server/routes/plans.js +33 -0
  158. package/server/routes/premium-v2.js +686 -686
  159. package/server/routes/premium.js +724 -724
  160. package/server/routes/providers.js +650 -0
  161. package/server/routes/runtime.js +2148 -2147
  162. package/server/routes/shieldqr.js +88 -0
  163. package/server/routes/sovereign.js +465 -385
  164. package/server/routes/universal.js +200 -185
  165. package/server/routes/wab-api.js +850 -501
  166. package/server/runtime/container-worker.js +111 -111
  167. package/server/runtime/container.js +448 -448
  168. package/server/runtime/distributed-worker.js +362 -362
  169. package/server/runtime/event-bus.js +210 -210
  170. package/server/runtime/index.js +253 -253
  171. package/server/runtime/queue.js +599 -599
  172. package/server/runtime/replay.js +666 -666
  173. package/server/runtime/sandbox.js +266 -266
  174. package/server/runtime/scheduler.js +534 -534
  175. package/server/runtime/session-engine.js +293 -293
  176. package/server/runtime/state-manager.js +188 -188
  177. package/server/security/cross-site-redactor.js +196 -0
  178. package/server/security/dry-run.js +180 -0
  179. package/server/security/human-gate-rate-limit.js +147 -0
  180. package/server/security/human-gate-transports.js +178 -0
  181. package/server/security/human-gate.js +281 -0
  182. package/server/security/index.js +368 -368
  183. package/server/security/intent-engine.js +245 -0
  184. package/server/security/reward-guard.js +171 -0
  185. package/server/security/rollback-store.js +239 -0
  186. package/server/security/token-scope.js +404 -0
  187. package/server/security/url-policy.js +139 -0
  188. package/server/services/agent-chat.js +506 -506
  189. package/server/services/agent-learning.js +601 -575
  190. package/server/services/agent-memory.js +625 -625
  191. package/server/services/agent-mesh.js +555 -539
  192. package/server/services/agent-symphony.js +717 -717
  193. package/server/services/agent-tasks.js +1807 -1807
  194. package/server/services/api-key-engine.js +292 -261
  195. package/server/services/cluster.js +894 -894
  196. package/server/services/commander.js +738 -738
  197. package/server/services/edge-compute.js +440 -440
  198. package/server/services/email.js +233 -204
  199. package/server/services/governance.js +466 -0
  200. package/server/services/hosted-runtime.js +205 -205
  201. package/server/services/lfd.js +635 -635
  202. package/server/services/local-ai.js +389 -389
  203. package/server/services/marketplace.js +270 -270
  204. package/server/services/metering.js +182 -182
  205. package/server/services/modules/affiliate-intelligence.js +93 -93
  206. package/server/services/modules/agent-firewall.js +90 -90
  207. package/server/services/modules/bounty.js +89 -89
  208. package/server/services/modules/collective-bargaining.js +92 -92
  209. package/server/services/modules/dark-pattern.js +66 -66
  210. package/server/services/modules/gov-intelligence.js +45 -45
  211. package/server/services/modules/neural.js +55 -55
  212. package/server/services/modules/notary.js +49 -49
  213. package/server/services/modules/price-time-machine.js +86 -86
  214. package/server/services/modules/protocol.js +104 -104
  215. package/server/services/negotiation.js +439 -439
  216. package/server/services/plans.js +214 -0
  217. package/server/services/plugins.js +771 -771
  218. package/server/services/premium.js +1 -1
  219. package/server/services/price-intelligence.js +566 -566
  220. package/server/services/price-shield.js +1137 -1137
  221. package/server/services/provider-clients.js +740 -0
  222. package/server/services/reputation.js +465 -465
  223. package/server/services/search-engine.js +357 -357
  224. package/server/services/security.js +513 -513
  225. package/server/services/self-healing.js +843 -843
  226. package/server/services/shieldqr.js +322 -0
  227. package/server/services/sovereign-shield.js +542 -0
  228. package/server/services/ssl-inspector.js +42 -0
  229. package/server/services/ssl-monitor.js +167 -0
  230. package/server/services/stripe.js +205 -192
  231. package/server/services/swarm.js +788 -788
  232. package/server/services/universal-scraper.js +662 -661
  233. package/server/services/verification.js +481 -481
  234. package/server/services/vision.js +1163 -1163
  235. package/server/services/wab-crypto.js +178 -0
  236. package/server/utils/cache.js +125 -125
  237. package/server/utils/migrate.js +81 -81
  238. package/server/utils/safe-fetch.js +228 -0
  239. package/server/utils/secureFields.js +50 -50
  240. package/server/ws.js +161 -161
  241. package/templates/artisan-marketplace.yaml +104 -104
  242. package/templates/book-price-scout.yaml +98 -98
  243. package/templates/electronics-price-tracker.yaml +108 -108
  244. package/templates/flight-deal-hunter.yaml +113 -113
  245. package/templates/freelancer-direct.yaml +116 -116
  246. package/templates/grocery-price-compare.yaml +93 -93
  247. package/templates/hotel-direct-booking.yaml +113 -113
  248. package/templates/local-services.yaml +98 -98
  249. package/templates/olive-oil-tunisia.yaml +88 -88
  250. package/templates/organic-farm-fresh.yaml +101 -101
  251. package/templates/restaurant-direct.yaml +97 -97
  252. package/public/score.html +0 -263
  253. package/server/migrations/006_growth_suite.sql +0 -138
  254. package/server/routes/growth.js +0 -962
  255. package/server/services/fairness-engine.js +0 -409
  256. package/server/services/fairness.js +0 -420
@@ -1,357 +1,357 @@
1
- /**
2
- * WAB Search Engine — Independent search aggregator with caching,
3
- * ranking, suggestions, and trending queries.
4
- *
5
- * All results are served under the WAB brand — no external engine
6
- * branding is ever exposed to the user.
7
- */
8
-
9
- const crypto = require('crypto');
10
-
11
- let db;
12
-
13
- function initSearchEngine(database) {
14
- db = database;
15
-
16
- db.exec(`
17
- CREATE TABLE IF NOT EXISTS search_cache (
18
- query_hash TEXT PRIMARY KEY,
19
- query TEXT NOT NULL,
20
- results TEXT NOT NULL,
21
- source TEXT DEFAULT 'multi',
22
- created_at TEXT DEFAULT (datetime('now')),
23
- hit_count INTEGER DEFAULT 1
24
- );
25
-
26
- CREATE TABLE IF NOT EXISTS search_history (
27
- id INTEGER PRIMARY KEY AUTOINCREMENT,
28
- query TEXT NOT NULL,
29
- ip_hash TEXT,
30
- results_count INTEGER DEFAULT 0,
31
- created_at TEXT DEFAULT (datetime('now'))
32
- );
33
-
34
- CREATE TABLE IF NOT EXISTS search_suggestions (
35
- query TEXT PRIMARY KEY,
36
- frequency INTEGER DEFAULT 1,
37
- last_searched TEXT DEFAULT (datetime('now'))
38
- );
39
-
40
- CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
- CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
- CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
- `);
44
- }
45
-
46
- // ─── Cache Layer ──────────────────────────────────────────────────────
47
-
48
- function queryHash(q) {
49
- return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
- }
51
-
52
- function getCachedResults(query) {
53
- const hash = queryHash(query);
54
- const row = db.prepare(
55
- `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
- ).get(hash);
57
- if (row) {
58
- db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
- return JSON.parse(row.results);
60
- }
61
- return null;
62
- }
63
-
64
- function setCachedResults(query, results, source) {
65
- const hash = queryHash(query);
66
- db.prepare(
67
- `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
- VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
- ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
- }
71
-
72
- // Purge old cache entries (>24h)
73
- function purgeOldCache() {
74
- db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
- }
76
-
77
- // ─── Search History & Suggestions ─────────────────────────────────────
78
-
79
- function recordSearch(query, ipHash, resultsCount) {
80
- db.prepare(
81
- `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
- ).run(query.trim(), ipHash || null, resultsCount);
83
-
84
- // Update suggestion frequency
85
- const normalized = query.toLowerCase().trim();
86
- if (normalized.length >= 2 && normalized.length <= 100) {
87
- const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
- if (existing) {
89
- db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
- } else {
91
- db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
- }
93
- }
94
- }
95
-
96
- function getSuggestions(prefix, limit = 8) {
97
- if (!prefix || prefix.length < 1) return [];
98
- const normalized = prefix.toLowerCase().trim();
99
- return db.prepare(
100
- `SELECT query, frequency FROM search_suggestions
101
- WHERE query LIKE ? AND frequency > 0
102
- ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
- ).all(normalized + '%', limit).map(r => r.query);
104
- }
105
-
106
- function getTrendingSearches(limit = 10) {
107
- return db.prepare(
108
- `SELECT query, COUNT(*) as count FROM search_history
109
- WHERE created_at > datetime('now', '-24 hours')
110
- GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
- ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
- }
113
-
114
- function getSearchStats() {
115
- const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
- const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
- const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
- const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
- return { total, today, cached, uniqueQueries };
120
- }
121
-
122
- // ─── Multi-Source Search ──────────────────────────────────────────────
123
-
124
- const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
- const HEADERS = {
126
- 'User-Agent': UA,
127
- 'Accept': 'text/html',
128
- 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
- };
130
-
131
- async function searchDDG(q) {
132
- try {
133
- const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
134
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
135
- const html = await resp.text();
136
- const results = [];
137
- const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
138
- const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
139
- const urls = [], titles = [], snippets = [];
140
- let m;
141
- while ((m = resultPattern.exec(html)) !== null) {
142
- urls.push(m[1]);
143
- titles.push(stripHtml(m[2]));
144
- }
145
- while ((m = snippetPattern.exec(html)) !== null) {
146
- snippets.push(decodeEntities(stripHtml(m[1])));
147
- }
148
- for (let i = 0; i < Math.min(urls.length, 15); i++) {
149
- let u = urls[i];
150
- const uddg = u.match(/uddg=([^&]+)/);
151
- if (uddg) u = decodeURIComponent(uddg[1]);
152
- if (!u.startsWith('http')) continue;
153
- results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
154
- }
155
- return results;
156
- } catch (e) {
157
- return [];
158
- }
159
- }
160
-
161
- async function searchGoogle(q) {
162
- try {
163
- const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
164
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
165
- const html = await resp.text();
166
- const results = [];
167
- const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
168
- let m;
169
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
170
- const u = decodeURIComponent(m[1]);
171
- if (!u.startsWith('http')) continue;
172
- try { if (new URL(u).hostname.includes('google.')) continue; } catch { continue; }
173
- const title = stripHtml(m[2]);
174
- if (!title) continue;
175
- results.push({ title, url: u, snippet: '', source: 'google' });
176
- }
177
- return results;
178
- } catch (e) {
179
- return [];
180
- }
181
- }
182
-
183
- async function searchBing(q) {
184
- try {
185
- const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
186
- const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
187
- const html = await resp.text();
188
- const results = [];
189
- // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
190
- const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
191
- let m;
192
- while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
193
- const u = m[1];
194
- if (!u.startsWith('http')) continue;
195
- try { if (new URL(u).hostname.includes('bing.')) continue; } catch { continue; }
196
- const title = stripHtml(m[2]);
197
- const snippet = decodeEntities(stripHtml(m[3]));
198
- if (!title) continue;
199
- results.push({ title, url: u, snippet, source: 'bing' });
200
- }
201
- return results;
202
- } catch (e) {
203
- return [];
204
- }
205
- }
206
-
207
- // ─── Result Ranking Engine ────────────────────────────────────────────
208
-
209
- function rankResults(allResults) {
210
- // Deduplicate by URL (keep the one with the best snippet)
211
- const seen = new Map();
212
- for (const r of allResults) {
213
- const normalizedUrl = normalizeUrl(r.url);
214
- const existing = seen.get(normalizedUrl);
215
- if (!existing) {
216
- seen.set(normalizedUrl, { ...r, sourceCount: 1 });
217
- } else {
218
- existing.sourceCount++;
219
- // Prefer the version with a snippet
220
- if (!existing.snippet && r.snippet) {
221
- existing.snippet = r.snippet;
222
- }
223
- // Prefer longer title
224
- if (r.title.length > existing.title.length) {
225
- existing.title = r.title;
226
- }
227
- }
228
- }
229
-
230
- const deduplicated = Array.from(seen.values());
231
-
232
- // Score each result
233
- for (const r of deduplicated) {
234
- let score = 0;
235
-
236
- // Multi-source bonus: appearing in multiple engines means higher relevance
237
- score += (r.sourceCount - 1) * 30;
238
-
239
- // Snippet presence
240
- if (r.snippet && r.snippet.length > 20) score += 15;
241
-
242
- // HTTPS bonus
243
- if (r.url.startsWith('https://')) score += 5;
244
-
245
- // Domain diversity: boost independent/small sites
246
- const hostname = safeHostname(r.url);
247
- const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
248
- const isBigTech = bigTech.some(d => hostname === d || hostname.endsWith('.' + d));
249
- if (!isBigTech) score += 8;
250
-
251
- // Trusted TLDs
252
- const tld = hostname.split('.').pop();
253
- if (['org','edu','gov','dev'].includes(tld)) score += 5;
254
-
255
- // Penalize very long URLs (likely junk)
256
- if (r.url.length > 200) score -= 10;
257
-
258
- r.score = score;
259
- }
260
-
261
- // Sort by score descending, then by original order
262
- deduplicated.sort((a, b) => b.score - a.score);
263
-
264
- // Return top 15, strip internal fields
265
- return deduplicated.slice(0, 15).map(r => ({
266
- title: r.title,
267
- url: r.url,
268
- snippet: r.snippet || '',
269
- }));
270
- }
271
-
272
- // ─── Main Search Function ─────────────────────────────────────────────
273
-
274
- async function search(query, ipHash) {
275
- if (!query || !query.trim()) return { results: [], cached: false };
276
-
277
- const q = query.trim();
278
-
279
- // Check cache first
280
- const cached = getCachedResults(q);
281
- if (cached && cached.length > 0) {
282
- recordSearch(q, ipHash, cached.length);
283
- return { results: cached, cached: true };
284
- }
285
-
286
- // Fetch from all sources in parallel
287
- const [ddgResults, googleResults, bingResults] = await Promise.allSettled([
288
- searchDDG(q),
289
- searchGoogle(q),
290
- searchBing(q),
291
- ]);
292
-
293
- const allResults = [
294
- ...(ddgResults.status === 'fulfilled' ? ddgResults.value : []),
295
- ...(googleResults.status === 'fulfilled' ? googleResults.value : []),
296
- ...(bingResults.status === 'fulfilled' ? bingResults.value : []),
297
- ];
298
-
299
- if (allResults.length === 0) {
300
- recordSearch(q, ipHash, 0);
301
- return { results: [], cached: false };
302
- }
303
-
304
- // Rank and deduplicate
305
- const ranked = rankResults(allResults);
306
-
307
- // Cache results
308
- setCachedResults(q, ranked, 'multi');
309
-
310
- // Record search
311
- recordSearch(q, ipHash, ranked.length);
312
-
313
- return { results: ranked, cached: false };
314
- }
315
-
316
- // ─── Helpers ──────────────────────────────────────────────────────────
317
-
318
- function stripHtml(s) {
319
- return (s || '').replace(/<[^>]+>/g, '').trim();
320
- }
321
-
322
- function decodeEntities(s) {
323
- return (s || '')
324
- .replace(/&amp;/g, '&')
325
- .replace(/&lt;/g, '<')
326
- .replace(/&gt;/g, '>')
327
- .replace(/&quot;/g, '"')
328
- .replace(/&#x27;/g, "'")
329
- .replace(/&#39;/g, "'")
330
- .trim();
331
- }
332
-
333
- function normalizeUrl(url) {
334
- try {
335
- const u = new URL(url);
336
- return u.hostname.replace(/^www\./, '') + u.pathname.replace(/\/$/, '') + u.search;
337
- } catch {
338
- return url;
339
- }
340
- }
341
-
342
- function safeHostname(url) {
343
- try {
344
- return new URL(url).hostname.replace(/^www\./, '');
345
- } catch {
346
- return '';
347
- }
348
- }
349
-
350
- module.exports = {
351
- initSearchEngine,
352
- search,
353
- getSuggestions,
354
- getTrendingSearches,
355
- getSearchStats,
356
- purgeOldCache,
357
- };
1
+ /**
2
+ * WAB Search Engine — Independent search aggregator with caching,
3
+ * ranking, suggestions, and trending queries.
4
+ *
5
+ * All results are served under the WAB brand — no external engine
6
+ * branding is ever exposed to the user.
7
+ */
8
+
9
+ const crypto = require('crypto');
10
+
11
+ let db;
12
+
13
+ function initSearchEngine(database) {
14
+ db = database;
15
+
16
+ db.exec(`
17
+ CREATE TABLE IF NOT EXISTS search_cache (
18
+ query_hash TEXT PRIMARY KEY,
19
+ query TEXT NOT NULL,
20
+ results TEXT NOT NULL,
21
+ source TEXT DEFAULT 'multi',
22
+ created_at TEXT DEFAULT (datetime('now')),
23
+ hit_count INTEGER DEFAULT 1
24
+ );
25
+
26
+ CREATE TABLE IF NOT EXISTS search_history (
27
+ id INTEGER PRIMARY KEY AUTOINCREMENT,
28
+ query TEXT NOT NULL,
29
+ ip_hash TEXT,
30
+ results_count INTEGER DEFAULT 0,
31
+ created_at TEXT DEFAULT (datetime('now'))
32
+ );
33
+
34
+ CREATE TABLE IF NOT EXISTS search_suggestions (
35
+ query TEXT PRIMARY KEY,
36
+ frequency INTEGER DEFAULT 1,
37
+ last_searched TEXT DEFAULT (datetime('now'))
38
+ );
39
+
40
+ CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
41
+ CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
42
+ CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
43
+ `);
44
+ }
45
+
46
+ // ─── Cache Layer ──────────────────────────────────────────────────────
47
+
48
+ function queryHash(q) {
49
+ return crypto.createHash('sha256').update(q.toLowerCase().trim()).digest('hex').slice(0, 32);
50
+ }
51
+
52
+ function getCachedResults(query) {
53
+ const hash = queryHash(query);
54
+ const row = db.prepare(
55
+ `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
56
+ ).get(hash);
57
+ if (row) {
58
+ db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
59
+ return JSON.parse(row.results);
60
+ }
61
+ return null;
62
+ }
63
+
64
+ function setCachedResults(query, results, source) {
65
+ const hash = queryHash(query);
66
+ db.prepare(
67
+ `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
68
+ VALUES (?, ?, ?, ?, datetime('now'), 1)`
69
+ ).run(hash, query.toLowerCase().trim(), JSON.stringify(results), source || 'multi');
70
+ }
71
+
72
+ // Purge old cache entries (>24h)
73
+ function purgeOldCache() {
74
+ db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`).run();
75
+ }
76
+
77
+ // ─── Search History & Suggestions ─────────────────────────────────────
78
+
79
+ function recordSearch(query, ipHash, resultsCount) {
80
+ db.prepare(
81
+ `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
82
+ ).run(query.trim(), ipHash || null, resultsCount);
83
+
84
+ // Update suggestion frequency
85
+ const normalized = query.toLowerCase().trim();
86
+ if (normalized.length >= 2 && normalized.length <= 100) {
87
+ const existing = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
88
+ if (existing) {
89
+ db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
90
+ } else {
91
+ db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
92
+ }
93
+ }
94
+ }
95
+
96
+ function getSuggestions(prefix, limit = 8) {
97
+ if (!prefix || prefix.length < 1) return [];
98
+ const normalized = prefix.toLowerCase().trim();
99
+ return db.prepare(
100
+ `SELECT query, frequency FROM search_suggestions
101
+ WHERE query LIKE ? AND frequency > 0
102
+ ORDER BY frequency DESC, last_searched DESC LIMIT ?`
103
+ ).all(normalized + '%', limit).map(r => r.query);
104
+ }
105
+
106
+ function getTrendingSearches(limit = 10) {
107
+ return db.prepare(
108
+ `SELECT query, COUNT(*) as count FROM search_history
109
+ WHERE created_at > datetime('now', '-24 hours')
110
+ GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
111
+ ).all(limit).map(r => ({ query: r.query, count: r.count }));
112
+ }
113
+
114
+ function getSearchStats() {
115
+ const total = db.prepare(`SELECT COUNT(*) as c FROM search_history`).get().c;
116
+ const today = db.prepare(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`).get().c;
117
+ const cached = db.prepare(`SELECT COUNT(*) as c FROM search_cache`).get().c;
118
+ const uniqueQueries = db.prepare(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`).get().c;
119
+ return { total, today, cached, uniqueQueries };
120
+ }
121
+
122
+ // ─── Multi-Source Search ──────────────────────────────────────────────
123
+
124
+ const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';
125
+ const HEADERS = {
126
+ 'User-Agent': UA,
127
+ 'Accept': 'text/html',
128
+ 'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
129
+ };
130
+
131
/**
 * Queries DuckDuckGo's HTML endpoint and extracts up to 15 results.
 *
 * Result links and snippets are matched independently and paired by index.
 * Redirect links carrying a `uddg=` parameter are unwrapped to the target URL.
 * A link whose `uddg` value is not valid percent-encoding is skipped on its
 * own instead of aborting the whole extraction, and titles are entity-decoded
 * the same way snippets are.
 *
 * @param {string} q Search query (URL-encoded by this function).
 * @returns {Promise<{title: string, url: string, snippet: string, source: 'ddg'}[]>}
 *   Extracted results; an empty array on any fetch or parsing failure.
 */
async function searchDDG(q) {
  try {
    const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    const html = await resp.text();

    const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
    const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;

    const links = [...html.matchAll(resultPattern)];
    const snippets = [...html.matchAll(snippetPattern)].map((m) => decodeEntities(stripHtml(m[1])));

    const results = [];
    const limit = Math.min(links.length, 15);
    for (let i = 0; i < limit; i++) {
      let target = links[i][1];
      const uddg = target.match(/uddg=([^&]+)/);
      if (uddg) {
        try {
          target = decodeURIComponent(uddg[1]);
        } catch {
          // Malformed percent-encoding: drop this link only.
          continue;
        }
      }
      if (!target.startsWith('http')) continue;

      // Strip tags first, then decode, so decoded "<" is never treated as markup.
      const title = decodeEntities(stripHtml(links[i][2]));
      results.push({ title: title || target, url: target, snippet: snippets[i] || '', source: 'ddg' });
    }
    return results;
  } catch (e) {
    // Best-effort source: a failing engine contributes no results.
    return [];
  }
}
160
+
161
/**
 * Queries Google's HTML results page and extracts up to 15 outbound links.
 *
 * Only anchors of the form `/url?q=<target>` are considered. Links pointing
 * at a hostname containing `google.` and links without visible text are
 * dropped. A link whose target is not valid percent-encoding is skipped on
 * its own instead of discarding every result, and titles are entity-decoded.
 *
 * @param {string} q Search query (URL-encoded by this function).
 * @returns {Promise<{title: string, url: string, snippet: string, source: 'google'}[]>}
 *   Extracted results (snippet is always empty); an empty array on any
 *   fetch or parsing failure.
 */
async function searchGoogle(q) {
  try {
    const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    const html = await resp.text();

    const results = [];
    const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
    let m;
    while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
      let target;
      try {
        target = decodeURIComponent(m[1]);
      } catch {
        // Malformed percent-encoding: drop this link only.
        continue;
      }
      if (!target.startsWith('http')) continue;

      try {
        if (new URL(target).hostname.includes('google.')) continue;
      } catch {
        continue;
      }

      // Strip tags first, then decode, so decoded "<" is never treated as markup.
      const title = decodeEntities(stripHtml(m[2]));
      if (!title) continue;

      results.push({ title, url: target, snippet: '', source: 'google' });
    }
    return results;
  } catch (e) {
    // Best-effort source: a failing engine contributes no results.
    return [];
  }
}
182
+
183
/**
 * Queries Bing's HTML results page and extracts up to 15 results.
 *
 * Each match spans a `<li class="b_algo">` item: the first absolute link
 * inside it supplies URL and title, the first following `<p>` supplies the
 * snippet. The URL comes from an HTML attribute, so it is entity-decoded
 * (`&amp;` becomes `&`) before use; titles are entity-decoded like snippets.
 * Links to hostnames containing `bing.` and links without visible text are
 * dropped.
 *
 * @param {string} q Search query (URL-encoded by this function).
 * @returns {Promise<{title: string, url: string, snippet: string, source: 'bing'}[]>}
 *   Extracted results; an empty array on any fetch or parsing failure.
 */
async function searchBing(q) {
  try {
    const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    const html = await resp.text();

    const results = [];
    // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
    const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
    let m;
    while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
      // The pattern already guarantees an http(s) scheme; only entities need undoing.
      const target = decodeEntities(m[1]);

      try {
        if (new URL(target).hostname.includes('bing.')) continue;
      } catch {
        continue;
      }

      // Strip tags first, then decode, so decoded "<" is never treated as markup.
      const title = decodeEntities(stripHtml(m[2]));
      if (!title) continue;

      const snippet = decodeEntities(stripHtml(m[3]));
      results.push({ title, url: target, snippet, source: 'bing' });
    }
    return results;
  } catch (e) {
    // Best-effort source: a failing engine contributes no results.
    return [];
  }
}
206
+
207
+ // ─── Result Ranking Engine ────────────────────────────────────────────
208
+
209
/**
 * Merges results from several engines, scores them, and returns the top 15.
 *
 * Results are de-duplicated by `normalizeUrl(url)`. The first occurrence is
 * kept; later duplicates can contribute a snippet (when none is present yet)
 * and a longer title. The multi-engine bonus counts DISTINCT `source` values,
 * so an engine that lists the same URL several times does not earn it by
 * itself. Results without a `source` each count as their own source.
 *
 * Scoring:
 *   +30 per additional distinct source
 *   +15 snippet longer than 20 characters
 *   +5  https URL
 *   +8  hostname is not one of the listed large platforms
 *   +5  top-level domain is org / edu / gov / dev
 *   -10 URL longer than 200 characters
 *
 * The sort comparator only compares scores, so ties fall back to whatever
 * order `Array.prototype.sort` leaves them in.
 *
 * @param {{title: string, url: string, snippet?: string, source?: string}[]} allResults
 *   Raw results from all engines; the input objects are not mutated.
 * @returns {{title: string, url: string, snippet: string}[]} At most 15 ranked results.
 */
function rankResults(allResults) {
  // Built once per call rather than once per scored result.
  const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
  const trustedTlds = ['org','edu','gov','dev'];

  // Deduplicate by normalized URL, remembering which engines reported each one.
  const seen = new Map();
  for (const r of allResults) {
    const key = normalizeUrl(r.url);
    // A fresh Symbol makes every source-less result count individually.
    const sourceKey = r.source ?? Symbol('unknown-source');
    const existing = seen.get(key);
    if (!existing) {
      seen.set(key, { ...r, sources: new Set([sourceKey]) });
      continue;
    }
    existing.sources.add(sourceKey);
    // Prefer the version with a snippet
    if (!existing.snippet && r.snippet) {
      existing.snippet = r.snippet;
    }
    // Prefer longer title
    if (r.title.length > existing.title.length) {
      existing.title = r.title;
    }
  }

  const deduplicated = Array.from(seen.values());

  for (const r of deduplicated) {
    // Multi-source bonus: appearing in multiple engines means higher relevance
    let score = (r.sources.size - 1) * 30;

    // Snippet presence
    if (r.snippet && r.snippet.length > 20) score += 15;

    // HTTPS bonus
    if (r.url.startsWith('https://')) score += 5;

    // Domain diversity: boost independent/small sites
    const hostname = safeHostname(r.url);
    const isBigTech = bigTech.some((d) => hostname === d || hostname.endsWith('.' + d));
    if (!isBigTech) score += 8;

    // Trusted TLDs
    const tld = hostname.split('.').pop();
    if (trustedTlds.includes(tld)) score += 5;

    // Penalize very long URLs (likely junk)
    if (r.url.length > 200) score -= 10;

    r.score = score;
  }

  // Sort by score descending
  deduplicated.sort((a, b) => b.score - a.score);

  // Return top 15, strip internal fields
  return deduplicated.slice(0, 15).map((r) => ({
    title: r.title,
    url: r.url,
    snippet: r.snippet || '',
  }));
}
271
+
272
+ // ─── Main Search Function ─────────────────────────────────────────────
273
+
274
/**
 * Runs a search for `query`, serving from cache when possible.
 *
 * Flow: trim the query, return a non-empty cache hit, otherwise query
 * DuckDuckGo, Google and Bing in parallel, rank the merged results, cache
 * them under the source label 'multi', and return them. Every non-blank
 * search is recorded via `recordSearch` with the number of results served.
 *
 * @param {string} query Raw user query; blank or falsy input short-circuits.
 * @param {string} ipHash Caller identifier forwarded to `recordSearch`.
 * @returns {Promise<{results: Array, cached: boolean}>} `cached` is true only
 *   when the results came from the cache.
 */
async function search(query, ipHash) {
  const q = query ? query.trim() : '';
  if (!q) {
    return { results: [], cached: false };
  }

  // Serve from cache when there is a non-empty hit.
  const cacheHit = getCachedResults(q);
  if (cacheHit && cacheHit.length > 0) {
    recordSearch(q, ipHash, cacheHit.length);
    return { results: cacheHit, cached: true };
  }

  // Query every engine concurrently; a rejected engine contributes nothing.
  const outcomes = await Promise.allSettled([
    searchDDG(q),
    searchGoogle(q),
    searchBing(q),
  ]);

  const merged = [];
  for (const outcome of outcomes) {
    if (outcome.status === 'fulfilled') {
      merged.push(...outcome.value);
    }
  }

  // Only rank and cache when at least one engine produced something.
  let results = [];
  if (merged.length > 0) {
    results = rankResults(merged);
    setCachedResults(q, results, 'multi');
  }

  recordSearch(q, ipHash, results.length);
  return { results, cached: false };
}
315
+
316
+ // ─── Helpers ──────────────────────────────────────────────────────────
317
+
318
/**
 * Removes anything that looks like an HTML tag and trims the remainder.
 *
 * @param {string|null|undefined} s Markup fragment; falsy input is treated as ''.
 * @returns {string} Text with every `<...>` run removed and outer whitespace trimmed.
 */
function stripHtml(s) {
  const markup = s || '';
  const withoutTags = markup.replace(/<[^>]+>/g, '');
  return withoutTags.trim();
}
321
+
322
/**
 * Decodes common HTML character references and trims the result.
 *
 * Handles the named references `&amp; &lt; &gt; &quot; &apos;` and any
 * decimal (`&#39;`) or hexadecimal (`&#x27;`) numeric reference. Decoding
 * happens in a single pass, so already-escaped text is unescaped exactly
 * once: `&amp;lt;` becomes `&lt;`, not `<`. Numeric references outside the
 * valid Unicode range (or naming a surrogate) are left untouched.
 *
 * @param {string|null|undefined} s Text containing entities; falsy input is treated as ''.
 * @returns {string} Decoded, trimmed text.
 */
function decodeEntities(s) {
  const named = { amp: '&', lt: '<', gt: '>', quot: '"', apos: "'" };

  return (s || '')
    .replace(/&(?:#x([0-9a-f]+)|#(\d+)|(amp|lt|gt|quot|apos));/gi, (match, hex, dec, name) => {
      if (name !== undefined) return named[name.toLowerCase()];

      const codePoint = hex !== undefined ? Number.parseInt(hex, 16) : Number.parseInt(dec, 10);
      const isSurrogate = codePoint >= 0xd800 && codePoint <= 0xdfff;
      if (codePoint <= 0 || codePoint > 0x10ffff || isSurrogate) return match;
      return String.fromCodePoint(codePoint);
    })
    .trim();
}
332
+
333
/**
 * Builds the de-duplication key for a URL.
 *
 * The key is hostname (without a leading `www.`) + path (without one
 * trailing slash) + query string. Scheme, port and fragment are not part
 * of the key. Input that cannot be parsed as a URL is returned unchanged.
 *
 * @param {string} url Absolute URL.
 * @returns {string} Normalized key, or `url` itself when parsing fails.
 */
function normalizeUrl(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return url;
  }

  const { hostname, pathname, search } = parsed;
  const host = hostname.startsWith('www.') ? hostname.slice(4) : hostname;
  const path = pathname.endsWith('/') ? pathname.slice(0, -1) : pathname;
  return host + path + search;
}
341
+
342
/**
 * Extracts the hostname of a URL without throwing.
 *
 * @param {string} url Absolute URL.
 * @returns {string} Hostname with a leading `www.` removed, or '' when
 *   `url` cannot be parsed.
 */
function safeHostname(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return '';
  }
  return parsed.hostname.replace(/^www\./, '');
}
349
+
350
// Public surface of the search engine module.
const searchEngineApi = {
  initSearchEngine,
  search,
  getSuggestions,
  getTrendingSearches,
  getSearchStats,
  purgeOldCache,
};

module.exports = searchEngineApi;