web-agent-bridge 2.3.1 → 2.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.ar.md +524 -31
- package/README.md +592 -47
- package/bin/agent-runner.js +10 -1
- package/package.json +1 -1
- package/public/agent-workspace.html +347 -0
- package/public/browser.html +484 -0
- package/public/css/agent-workspace.css +1713 -0
- package/public/index.html +94 -0
- package/public/js/agent-workspace.js +1740 -0
- package/sdk/index.d.ts +253 -0
- package/sdk/index.js +360 -1
- package/sdk/package.json +1 -1
- package/server/config/secrets.js +13 -5
- package/server/control-plane/index.js +301 -0
- package/server/data-plane/index.js +354 -0
- package/server/index.js +185 -4
- package/server/llm/index.js +404 -0
- package/server/middleware/adminAuth.js +6 -1
- package/server/middleware/auth.js +11 -2
- package/server/middleware/rateLimits.js +78 -2
- package/server/migrations/003_ads_integer_cents.sql +33 -0
- package/server/models/db.js +126 -25
- package/server/observability/index.js +394 -0
- package/server/protocol/capabilities.js +223 -0
- package/server/protocol/index.js +243 -0
- package/server/protocol/schema.js +584 -0
- package/server/registry/index.js +326 -0
- package/server/routes/admin.js +16 -2
- package/server/routes/ads.js +130 -0
- package/server/routes/agent-workspace.js +378 -0
- package/server/routes/api.js +21 -2
- package/server/routes/auth.js +26 -6
- package/server/routes/runtime.js +725 -0
- package/server/routes/sovereign.js +78 -0
- package/server/routes/universal.js +177 -0
- package/server/routes/wab-api.js +20 -5
- package/server/runtime/event-bus.js +210 -0
- package/server/runtime/index.js +233 -0
- package/server/runtime/sandbox.js +266 -0
- package/server/runtime/scheduler.js +395 -0
- package/server/runtime/state-manager.js +188 -0
- package/server/security/index.js +355 -0
- package/server/services/agent-chat.js +506 -0
- package/server/services/agent-symphony.js +6 -0
- package/server/services/agent-tasks.js +1807 -0
- package/server/services/fairness-engine.js +409 -0
- package/server/services/plugins.js +27 -3
- package/server/services/price-intelligence.js +565 -0
- package/server/services/price-shield.js +1137 -0
- package/server/services/search-engine.js +357 -0
- package/server/services/security.js +513 -0
- package/server/services/universal-scraper.js +661 -0
- package/server/ws.js +61 -1
|
@@ -0,0 +1,357 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* WAB Search Engine — Independent search aggregator with caching,
|
|
3
|
+
* ranking, suggestions, and trending queries.
|
|
4
|
+
*
|
|
5
|
+
* All results are served under the WAB brand — no external engine
|
|
6
|
+
* branding is ever exposed to the user.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
const crypto = require('crypto');
|
|
10
|
+
|
|
11
|
+
let db;
|
|
12
|
+
|
|
13
|
+
/**
 * Binds this module to a database handle and makes sure the search tables
 * (cache, history, suggestions) and their indexes exist.
 *
 * @param {object} database - Handle exposing `exec(sql)`; kept in the
 *   module-level `db` variable for every other function in this file.
 */
function initSearchEngine(database) {
  db = database;

  // All statements are idempotent (IF NOT EXISTS), so calling this more than
  // once against the same database is harmless.
  const schemaSql = `
    CREATE TABLE IF NOT EXISTS search_cache (
      query_hash TEXT PRIMARY KEY,
      query TEXT NOT NULL,
      results TEXT NOT NULL,
      source TEXT DEFAULT 'multi',
      created_at TEXT DEFAULT (datetime('now')),
      hit_count INTEGER DEFAULT 1
    );

    CREATE TABLE IF NOT EXISTS search_history (
      id INTEGER PRIMARY KEY AUTOINCREMENT,
      query TEXT NOT NULL,
      ip_hash TEXT,
      results_count INTEGER DEFAULT 0,
      created_at TEXT DEFAULT (datetime('now'))
    );

    CREATE TABLE IF NOT EXISTS search_suggestions (
      query TEXT PRIMARY KEY,
      frequency INTEGER DEFAULT 1,
      last_searched TEXT DEFAULT (datetime('now'))
    );

    CREATE INDEX IF NOT EXISTS idx_search_cache_created ON search_cache(created_at);
    CREATE INDEX IF NOT EXISTS idx_search_history_created ON search_history(created_at);
    CREATE INDEX IF NOT EXISTS idx_search_suggestions_freq ON search_suggestions(frequency DESC);
  `;

  db.exec(schemaSql);
}
|
|
45
|
+
|
|
46
|
+
// ─── Cache Layer ──────────────────────────────────────────────────────
|
|
47
|
+
|
|
48
|
+
/**
 * Derives the cache key for a query: the first 32 hex characters of the
 * SHA-256 digest of the lower-cased, trimmed query text.
 *
 * @param {string} q - Raw query text.
 * @returns {string} 32-character lowercase hex string.
 */
function queryHash(q) {
  const canonical = q.toLowerCase().trim();
  const digest = crypto.createHash('sha256').update(canonical).digest('hex');
  return digest.slice(0, 32);
}
|
|
51
|
+
|
|
52
|
+
/**
 * Looks up cached results for a query that were stored within the last hour.
 *
 * On a hit the row's `hit_count` is incremented. A row whose stored JSON
 * cannot be parsed is treated as a cache miss instead of throwing, so one
 * corrupt row cannot break searching for that query.
 *
 * @param {string} query - Query text; hashed with `queryHash`.
 * @returns {*} The parsed `results` payload, or `null` on a miss.
 */
function getCachedResults(query) {
  const hash = queryHash(query);
  const row = db.prepare(
    `SELECT results, created_at FROM search_cache WHERE query_hash = ? AND created_at > datetime('now', '-1 hour')`
  ).get(hash);
  if (!row) return null;

  let parsed;
  try {
    parsed = JSON.parse(row.results);
  } catch {
    // Corrupt payload: report a miss so the caller re-fetches.
    return null;
  }

  // Count the hit only once the payload is known to be usable.
  db.prepare(`UPDATE search_cache SET hit_count = hit_count + 1 WHERE query_hash = ?`).run(hash);
  return parsed;
}
|
|
63
|
+
|
|
64
|
+
/**
 * Stores (or overwrites) the cached results for a query.
 *
 * The row is keyed by `queryHash(query)`; the query text is saved lower-cased
 * and trimmed, `created_at` is reset to now and `hit_count` to 1.
 *
 * @param {string} query - Query text.
 * @param {*} results - JSON-serializable results payload.
 * @param {string} [source] - Source label; falls back to 'multi' when falsy.
 */
function setCachedResults(query, results, source) {
  const upsert = db.prepare(
    `INSERT OR REPLACE INTO search_cache (query_hash, query, results, source, created_at, hit_count)
     VALUES (?, ?, ?, ?, datetime('now'), 1)`
  );
  const key = queryHash(query);
  const storedQuery = query.toLowerCase().trim();
  const payload = JSON.stringify(results);
  upsert.run(key, storedQuery, payload, source || 'multi');
}
|
|
71
|
+
|
|
72
|
+
// Purge old cache entries (>24h)
|
|
73
|
+
/**
 * Deletes every `search_cache` row whose `created_at` is more than one day old.
 */
function purgeOldCache() {
  const purgeStmt = db.prepare(`DELETE FROM search_cache WHERE created_at < datetime('now', '-1 day')`);
  purgeStmt.run();
}
|
|
76
|
+
|
|
77
|
+
// ─── Search History & Suggestions ─────────────────────────────────────
|
|
78
|
+
|
|
79
|
+
/**
 * Appends a search to `search_history` and bumps the matching suggestion.
 *
 * @param {string} query - Query text (stored trimmed in the history row).
 * @param {string} [ipHash] - Hashed client identifier; stored as NULL when falsy.
 * @param {number} resultsCount - Number of results returned for the query.
 */
function recordSearch(query, ipHash, resultsCount) {
  const insertHistory = db.prepare(
    `INSERT INTO search_history (query, ip_hash, results_count) VALUES (?, ?, ?)`
  );
  insertHistory.run(query.trim(), ipHash || null, resultsCount);

  // Suggestions are tracked only for normalized queries of 2 to 100 characters.
  const normalized = query.toLowerCase().trim();
  if (normalized.length < 2 || normalized.length > 100) return;

  const known = db.prepare(`SELECT frequency FROM search_suggestions WHERE query = ?`).get(normalized);
  if (!known) {
    db.prepare(`INSERT INTO search_suggestions (query, frequency) VALUES (?, 1)`).run(normalized);
    return;
  }
  db.prepare(`UPDATE search_suggestions SET frequency = frequency + 1, last_searched = datetime('now') WHERE query = ?`).run(normalized);
}
|
|
95
|
+
|
|
96
|
+
/**
 * Returns stored queries that start with the given prefix, most frequent
 * first (ties broken by most recently searched).
 *
 * The prefix is lower-cased and trimmed before matching. LIKE wildcards
 * (`%`, `_`) and the escape character itself are escaped so that user input
 * is matched literally; a prefix that is empty after trimming, or that is
 * not a string, yields no suggestions.
 *
 * @param {string} prefix - Text typed so far.
 * @param {number} [limit=8] - Maximum number of suggestions.
 * @returns {string[]} Matching query strings.
 */
function getSuggestions(prefix, limit = 8) {
  if (typeof prefix !== 'string') return [];

  const normalized = prefix.toLowerCase().trim();
  // Checked after trimming: a whitespace-only prefix would otherwise become
  // the pattern '%' and match every stored suggestion.
  if (normalized.length === 0) return [];

  // Escape \, % and _ so they are treated as literal characters by LIKE.
  const pattern = normalized.replace(/[\\%_]/g, '\\$&') + '%';

  return db.prepare(
    `SELECT query, frequency FROM search_suggestions
     WHERE query LIKE ? ESCAPE '\\' AND frequency > 0
     ORDER BY frequency DESC, last_searched DESC LIMIT ?`
  ).all(pattern, limit).map(r => r.query);
}
|
|
105
|
+
|
|
106
|
+
/**
 * Lists the most frequent queries recorded in `search_history` during the
 * last 24 hours, grouped case-insensitively.
 *
 * @param {number} [limit=10] - Maximum number of entries.
 * @returns {{query: string, count: number}[]} Entries ordered by count, descending.
 */
function getTrendingSearches(limit = 10) {
  const trendingStmt = db.prepare(
    `SELECT query, COUNT(*) as count FROM search_history
     WHERE created_at > datetime('now', '-24 hours')
     GROUP BY LOWER(query) ORDER BY count DESC LIMIT ?`
  );
  const rows = trendingStmt.all(limit);
  return rows.map((row) => {
    return { query: row.query, count: row.count };
  });
}
|
|
113
|
+
|
|
114
|
+
/**
 * Collects aggregate counters about search activity.
 *
 * @returns {{total: number, today: number, cached: number, uniqueQueries: number}}
 *   `total` – all history rows; `today` – history rows from the last 24 hours;
 *   `cached` – rows currently in the cache table; `uniqueQueries` – distinct
 *   queries in history, compared case-insensitively.
 */
function getSearchStats() {
  // Each statement returns a single row with the count in column `c`.
  const countOf = (sql) => db.prepare(sql).get().c;

  return {
    total: countOf(`SELECT COUNT(*) as c FROM search_history`),
    today: countOf(`SELECT COUNT(*) as c FROM search_history WHERE created_at > datetime('now', '-24 hours')`),
    cached: countOf(`SELECT COUNT(*) as c FROM search_cache`),
    uniqueQueries: countOf(`SELECT COUNT(DISTINCT LOWER(query)) as c FROM search_history`),
  };
}
|
|
121
|
+
|
|
122
|
+
// ─── Multi-Source Search ──────────────────────────────────────────────
|
|
123
|
+
|
|
124
|
+
// User-Agent string sent with every upstream request.
const UA = 'Mozilla/5.0 (Linux; Android 13) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36';

// Request headers shared by all upstream fetches in this module.
const HEADERS = {
  'User-Agent': UA,
  Accept: 'text/html',
  'Accept-Language': 'en-US,en;q=0.9,ar;q=0.8',
};
|
|
130
|
+
|
|
131
|
+
/**
 * Queries the DuckDuckGo HTML endpoint and scrapes up to 15 results.
 *
 * Best-effort: any network, timeout or parsing failure, as well as a
 * non-2xx response, yields an empty array rather than an exception.
 *
 * @param {string} q - Query text.
 * @returns {Promise<{title: string, url: string, snippet: string, source: string}[]>}
 *   Results tagged with `source: 'ddg'`.
 */
async function searchDDG(q) {
  try {
    const url = 'https://html.duckduckgo.com/html/?q=' + encodeURIComponent(q);
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    if (!resp.ok) return [];
    const html = await resp.text();

    const resultPattern = /<a[^>]+class="result__a"[^>]+href="([^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
    const snippetPattern = /<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/gi;
    const urls = [];
    const titles = [];
    const snippets = [];

    let m;
    while ((m = resultPattern.exec(html)) !== null) {
      // Attribute values are HTML-escaped (e.g. `&amp;`), so decode them.
      urls.push(decodeEntities(m[1]));
      // Titles get the same entity decoding as snippets.
      titles.push(decodeEntities(stripHtml(m[2])));
    }
    while ((m = snippetPattern.exec(html)) !== null) {
      snippets.push(decodeEntities(stripHtml(m[1])));
    }

    // NOTE(review): links and snippets are paired purely by position; a result
    // rendered without a snippet would shift later snippets by one.
    const results = [];
    for (let i = 0; i < Math.min(urls.length, 15); i++) {
      let u = urls[i];
      // Result links go through a redirect carrying the target in `uddg`.
      const uddg = u.match(/uddg=([^&]+)/);
      if (uddg) {
        try {
          u = decodeURIComponent(uddg[1]);
        } catch {
          // Malformed percent-encoding: drop this result only, keep the rest.
          continue;
        }
      }
      if (!/^https?:\/\//i.test(u)) continue;
      results.push({ title: titles[i] || u, url: u, snippet: snippets[i] || '', source: 'ddg' });
    }
    return results;
  } catch {
    // Deliberately best-effort: one failing engine must not fail the search.
    return [];
  }
}
|
|
160
|
+
|
|
161
|
+
/**
 * Queries Google's HTML results page and scrapes up to 15 result links.
 *
 * Only anchors of the form `/url?q=<target>` are considered; links pointing
 * back at a Google host are skipped. Snippets are not extracted.
 * Best-effort: failures and non-2xx responses yield an empty array.
 *
 * @param {string} q - Query text.
 * @returns {Promise<{title: string, url: string, snippet: string, source: string}[]>}
 *   Results tagged with `source: 'google'`.
 */
async function searchGoogle(q) {
  try {
    const url = 'https://www.google.com/search?q=' + encodeURIComponent(q) + '&num=15&hl=en';
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    if (!resp.ok) return [];
    const html = await resp.text();

    const results = [];
    const linkPattern = /<a[^>]+href="\/url\?q=([^&"]+)[^"]*"[^>]*>([\s\S]*?)<\/a>/gi;
    let m;
    while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
      let u;
      try {
        u = decodeURIComponent(m[1]);
      } catch {
        // Malformed percent-encoding: skip this link instead of losing them all.
        continue;
      }
      if (!/^https?:\/\//i.test(u)) continue;
      try {
        if (new URL(u).hostname.includes('google.')) continue;
      } catch {
        continue;
      }
      // Titles are entity-decoded, matching how snippets are handled elsewhere.
      const title = decodeEntities(stripHtml(m[2]));
      if (!title) continue;
      results.push({ title, url: u, snippet: '', source: 'google' });
    }
    return results;
  } catch {
    // Deliberately best-effort: one failing engine must not fail the search.
    return [];
  }
}
|
|
182
|
+
|
|
183
|
+
/**
 * Queries Bing's HTML results page and scrapes up to 15 results.
 *
 * Each `<li class="b_algo">` item contributes its first absolute link, that
 * link's text as the title, and the first following paragraph as the snippet.
 * Links pointing back at a Bing host are skipped.
 * Best-effort: failures and non-2xx responses yield an empty array.
 *
 * @param {string} q - Query text.
 * @returns {Promise<{title: string, url: string, snippet: string, source: string}[]>}
 *   Results tagged with `source: 'bing'`.
 */
async function searchBing(q) {
  try {
    const url = 'https://www.bing.com/search?q=' + encodeURIComponent(q) + '&count=15';
    const resp = await fetch(url, { headers: HEADERS, signal: AbortSignal.timeout(8000) });
    if (!resp.ok) return [];
    const html = await resp.text();

    const results = [];
    // Bing result links: <a href="URL" h="ID=..."><strong>title</strong></a>
    const linkPattern = /<li class="b_algo"[^>]*>[\s\S]*?<a[^>]+href="(https?:\/\/[^"]+)"[^>]*>([\s\S]*?)<\/a>[\s\S]*?<p[^>]*>([\s\S]*?)<\/p>/gi;
    let m;
    while ((m = linkPattern.exec(html)) !== null && results.length < 15) {
      // The pattern already guarantees an http(s) URL; only the HTML escaping
      // of the attribute value (e.g. `&amp;`) needs undoing.
      const u = decodeEntities(m[1]);
      try {
        if (new URL(u).hostname.includes('bing.')) continue;
      } catch {
        continue;
      }
      // Titles get the same entity decoding as snippets.
      const title = decodeEntities(stripHtml(m[2]));
      const snippet = decodeEntities(stripHtml(m[3]));
      if (!title) continue;
      results.push({ title, url: u, snippet, source: 'bing' });
    }
    return results;
  } catch {
    // Deliberately best-effort: one failing engine must not fail the search.
    return [];
  }
}
|
|
206
|
+
|
|
207
|
+
// ─── Result Ranking Engine ────────────────────────────────────────────
|
|
208
|
+
|
|
209
|
+
/**
 * Merges results from several engines, scores them and returns the top 15.
 *
 * Results are deduplicated by `normalizeUrl(url)`. The first occurrence is
 * kept; later duplicates may contribute a snippet (if none yet) or a longer
 * title. Scoring:
 *   +30 for every additional *distinct* source that returned the URL,
 *   +15 for a snippet longer than 20 characters,
 *   +5  for an https URL,
 *   +8  when the host is not on the big-tech list,
 *   +5  for a .org/.edu/.gov/.dev host,
 *   -10 for URLs longer than 200 characters.
 * Ties keep their input order, since `Array.prototype.sort` is stable.
 *
 * @param {{title: string, url: string, snippet?: string, source?: string}[]} allResults
 *   Raw results; the input objects are not mutated.
 * @returns {{title: string, url: string, snippet: string}[]} At most 15 ranked results.
 */
function rankResults(allResults) {
  // Built once per call rather than once per scored result.
  const bigTech = ['google.com','youtube.com','facebook.com','amazon.com','apple.com','microsoft.com','twitter.com','x.com','instagram.com','tiktok.com','linkedin.com','reddit.com','pinterest.com'];
  const trustedTlds = new Set(['org','edu','gov','dev']);

  // Deduplicate by URL (keep the one with the best snippet)
  const seen = new Map();
  for (const r of allResults) {
    const normalizedUrl = normalizeUrl(r.url);
    const existing = seen.get(normalizedUrl);
    if (!existing) {
      seen.set(normalizedUrl, { ...r, title: r.title || '', sources: new Set([r.source]) });
      continue;
    }
    // Track distinct sources: the same engine listing a URL twice must not
    // earn the multi-source bonus.
    existing.sources.add(r.source);
    // Prefer the version with a snippet
    if (!existing.snippet && r.snippet) {
      existing.snippet = r.snippet;
    }
    // Prefer longer title
    if (r.title && r.title.length > existing.title.length) {
      existing.title = r.title;
    }
  }

  const deduplicated = Array.from(seen.values());

  // Score each result
  for (const r of deduplicated) {
    let score = 0;

    // Multi-source bonus: appearing in multiple engines means higher relevance
    score += (r.sources.size - 1) * 30;

    // Snippet presence
    if (r.snippet && r.snippet.length > 20) score += 15;

    // HTTPS bonus
    if (r.url.startsWith('https://')) score += 5;

    // Domain diversity: boost independent/small sites
    const hostname = safeHostname(r.url);
    const isBigTech = bigTech.some(d => hostname === d || hostname.endsWith('.' + d));
    if (!isBigTech) score += 8;

    // Trusted TLDs
    const tld = hostname.split('.').pop();
    if (trustedTlds.has(tld)) score += 5;

    // Penalize very long URLs (likely junk)
    if (r.url.length > 200) score -= 10;

    r.score = score;
  }

  // Sort by score descending; equal scores keep their original order.
  deduplicated.sort((a, b) => b.score - a.score);

  // Return top 15, strip internal fields
  return deduplicated.slice(0, 15).map(r => ({
    title: r.title,
    url: r.url,
    snippet: r.snippet || '',
  }));
}
|
|
271
|
+
|
|
272
|
+
// ─── Main Search Function ─────────────────────────────────────────────
|
|
273
|
+
|
|
274
|
+
/**
 * Runs a search: serves from the cache when possible, otherwise queries all
 * engines in parallel, ranks the merged results, caches and returns them.
 * Every non-empty query is recorded in the search history.
 *
 * @param {string} query - User query; an empty or whitespace-only query returns no results.
 * @param {string} [ipHash] - Hashed client identifier passed through to the history.
 * @returns {Promise<{results: object[], cached: boolean}>} `cached` is true
 *   only when the results came from the cache.
 */
async function search(query, ipHash) {
  const q = query ? query.trim() : '';
  if (!q) {
    return { results: [], cached: false };
  }

  // Cache lookup; an empty cached list is treated as a miss.
  const fromCache = getCachedResults(q);
  if (fromCache && fromCache.length > 0) {
    recordSearch(q, ipHash, fromCache.length);
    return { results: fromCache, cached: true };
  }

  // Query every engine concurrently and keep whatever succeeded.
  const outcomes = await Promise.allSettled([
    searchDDG(q),
    searchGoogle(q),
    searchBing(q),
  ]);
  const allResults = outcomes.flatMap((outcome) =>
    outcome.status === 'fulfilled' ? outcome.value : []
  );

  // Nothing found anywhere: record the miss, but do not cache it.
  if (allResults.length === 0) {
    recordSearch(q, ipHash, 0);
    return { results: [], cached: false };
  }

  const ranked = rankResults(allResults);
  setCachedResults(q, ranked, 'multi');
  recordSearch(q, ipHash, ranked.length);

  return { results: ranked, cached: false };
}
|
|
315
|
+
|
|
316
|
+
// ─── Helpers ──────────────────────────────────────────────────────────
|
|
317
|
+
|
|
318
|
+
/**
 * Removes anything that looks like an HTML tag and trims the result.
 *
 * @param {string} [s] - Markup fragment; falsy values are treated as ''.
 * @returns {string} Text with `<...>` sequences removed.
 */
function stripHtml(s) {
  const markup = s || '';
  const withoutTags = markup.replace(/<[^>]+>/g, '');
  return withoutTags.trim();
}
|
|
321
|
+
|
|
322
|
+
/**
 * Decodes the common HTML entities found in scraped titles and snippets and
 * trims the result.
 *
 * Handled entities: `&amp;`, `&lt;`, `&gt;`, `&quot;`, `&apos;`, `&#39;`,
 * `&#039;` and `&#x27;`. Decoding is done in a single pass so that already
 * escaped text is not decoded twice (`&amp;lt;` becomes `&lt;`, not `<`).
 *
 * @param {string} [s] - Text possibly containing entities; falsy values are treated as ''.
 * @returns {string} Decoded, trimmed text.
 */
function decodeEntities(s) {
  const entities = {
    '&amp;': '&',
    '&lt;': '<',
    '&gt;': '>',
    '&quot;': '"',
    '&apos;': "'",
    '&#39;': "'",
    '&#039;': "'",
    '&#x27;': "'",
  };
  return (s || '')
    .replace(/&(?:amp|lt|gt|quot|apos|#39|#039|#x27);/g, (entity) => entities[entity])
    .trim();
}
|
|
332
|
+
|
|
333
|
+
/**
 * Produces the key used to detect duplicate results: host without a leading
 * `www.`, path without one trailing slash, plus the query string. Scheme and
 * fragment are ignored.
 *
 * @param {string} url - URL to normalize.
 * @returns {string} Normalized key, or the input unchanged if it does not parse as a URL.
 */
function normalizeUrl(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return url;
  }
  const host = parsed.hostname.replace(/^www\./, '');
  const path = parsed.pathname.replace(/\/$/, '');
  return host + path + parsed.search;
}
|
|
341
|
+
|
|
342
|
+
/**
 * Extracts the hostname of a URL with a leading `www.` removed.
 *
 * @param {string} url - URL to inspect.
 * @returns {string} Hostname, or '' when the input does not parse as a URL.
 */
function safeHostname(url) {
  let host;
  try {
    host = new URL(url).hostname;
  } catch {
    return '';
  }
  return host.replace(/^www\./, '');
}
|
|
349
|
+
|
|
350
|
+
// Public API of the search engine module; everything else in this file is internal.
const publicApi = {
  initSearchEngine,
  search,
  getSuggestions,
  getTrendingSearches,
  getSearchStats,
  purgeOldCache,
};

module.exports = publicApi;
|