web-agent-bridge 3.4.0 → 3.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +84 -84
- package/README.ar.md +1565 -1304
- package/README.md +171 -298
- package/bin/agent-runner.js +474 -474
- package/bin/cli.js +237 -237
- package/bin/wab-init.js +244 -223
- package/bin/wab.js +80 -80
- package/examples/azure-dns-wab.js +83 -83
- package/examples/bidi-agent.js +119 -119
- package/examples/cloudflare-wab-dns.js +121 -121
- package/examples/cpanel-wab-dns.js +114 -114
- package/examples/cross-site-agent.js +91 -91
- package/examples/dns-discovery-agent.js +166 -166
- package/examples/gcp-dns-wab.js +76 -76
- package/examples/governance-agent.js +169 -169
- package/examples/mcp-agent.js +94 -94
- package/examples/next-app-router/README.md +44 -44
- package/examples/plesk-wab-dns.js +103 -103
- package/examples/puppeteer-agent.js +108 -108
- package/examples/route53-wab-dns.js +144 -144
- package/examples/saas-dashboard/README.md +55 -55
- package/examples/safe-mode-agent.js +96 -96
- package/examples/self-discovery.js +106 -0
- package/examples/shopify-hydrogen/README.md +74 -74
- package/examples/vision-agent.js +171 -171
- package/examples/wab-sign.js +74 -74
- package/examples/wab-verify.js +60 -60
- package/examples/wordpress-elementor/README.md +77 -77
- package/package.json +93 -93
- package/public/.well-known/agent-tools.json +180 -180
- package/public/.well-known/ai-assets.json +59 -59
- package/public/.well-known/security.txt +8 -8
- package/public/.well-known/wab.json +28 -28
- package/public/activate.html +448 -368
- package/public/adopt.html +236 -0
- package/public/adoption-metrics.html +188 -188
- package/public/agent-workspace.html +359 -349
- package/public/ai.html +198 -198
- package/public/api.html +397 -413
- package/public/atp.html +171 -0
- package/public/azure-dns-integration.html +289 -289
- package/public/browser.html +486 -486
- package/public/cloudflare-integration.html +380 -380
- package/public/commander-dashboard.html +243 -243
- package/public/cookies.html +210 -210
- package/public/cpanel-integration.html +398 -398
- package/public/css/agent-workspace.css +1713 -1713
- package/public/css/premium.css +317 -317
- package/public/css/styles.css +1401 -1263
- package/public/dashboard-shieldlink.html +295 -0
- package/public/dashboard.html +711 -707
- package/public/dns.html +436 -436
- package/public/docs.html +588 -588
- package/public/enterprise-mesh.ar.html +80 -0
- package/public/enterprise-mesh.html +81 -0
- package/public/feed.xml +89 -89
- package/public/gcp-dns-integration.html +318 -318
- package/public/governance.ar.html +70 -0
- package/public/governance.html +69 -0
- package/public/growth.html +465 -465
- package/public/index.html +1372 -1266
- package/public/integrations.html +556 -556
- package/public/js/activate.js +449 -145
- package/public/js/agent-workspace.js +1740 -1740
- package/public/js/auth-nav.js +117 -65
- package/public/js/auth-redirect.js +12 -12
- package/public/js/cookie-consent.js +56 -56
- package/public/js/dns.js +438 -438
- package/public/js/wab-demo-page.js +721 -721
- package/public/js/ws-client.js +74 -74
- package/public/l-preview.html +242 -0
- package/public/llms-full.txt +360 -360
- package/public/llms.txt +125 -125
- package/public/login.html +85 -85
- package/public/mesh-dashboard.html +328 -328
- package/public/milestones.html +346 -0
- package/public/one-click.html +779 -0
- package/public/openapi.json +669 -669
- package/public/partners.ar.html +145 -0
- package/public/partners.html +143 -0
- package/public/phone-shield.html +281 -281
- package/public/plesk-integration.html +375 -375
- package/public/premium-dashboard.html +2489 -2489
- package/public/premium.html +793 -793
- package/public/privacy.html +297 -297
- package/public/provider-onboarding.html +172 -172
- package/public/provider-sandbox.html +134 -134
- package/public/providers.html +359 -359
- package/public/refusals.html +172 -0
- package/public/register.html +105 -105
- package/public/registrar-integrations.html +141 -141
- package/public/ring4.html +292 -0
- package/public/robots.txt +99 -99
- package/public/route53-integration.html +531 -531
- package/public/score.html +263 -0
- package/public/script/wab-consent.d.ts +36 -36
- package/public/script/wab-consent.js +104 -104
- package/public/script/wab-schema.js +131 -131
- package/public/script/wab.d.ts +108 -108
- package/public/script/wab.min.js +580 -580
- package/public/security.txt +8 -8
- package/public/shieldlink.html +244 -0
- package/public/shieldqr.html +231 -231
- package/public/sitemap.xml +13 -1
- package/public/terms.html +256 -256
- package/public/trust-graph-api.ar.html +92 -0
- package/public/trust-graph-api.html +91 -0
- package/public/wab-features.html +560 -0
- package/public/wab-trust.html +200 -200
- package/public/wab-truth.html +375 -0
- package/public/wab-vs-protocols.html +210 -210
- package/public/whitepaper.html +449 -449
- package/script/ai-agent-bridge.js +1754 -1754
- package/sdk/README.md +99 -99
- package/sdk/agent-mesh.js +449 -449
- package/sdk/atp.js +103 -0
- package/sdk/auto-discovery.js +301 -288
- package/sdk/commander.js +262 -262
- package/sdk/governance.js +262 -262
- package/sdk/index.d.ts +464 -464
- package/sdk/index.js +653 -649
- package/sdk/multi-agent.js +318 -318
- package/sdk/safe-mode.js +221 -221
- package/sdk/safety-shield.js +219 -219
- package/sdk/schema-discovery.js +83 -83
- package/server/adapters/index.js +520 -520
- package/server/config/plans.js +412 -367
- package/server/config/secrets.js +102 -102
- package/server/control-plane/index.js +301 -301
- package/server/data-plane/index.js +354 -354
- package/server/index.js +793 -670
- package/server/llm/index.js +404 -404
- package/server/middleware/adminAuth.js +35 -35
- package/server/middleware/api-tier.js +170 -0
- package/server/middleware/auth.js +50 -50
- package/server/middleware/featureGate.js +88 -88
- package/server/middleware/rateLimits.js +100 -100
- package/server/middleware/sensitiveAction.js +157 -157
- package/server/middleware/wab-trust.js +141 -0
- package/server/migrations/001_add_analytics_indexes.sql +7 -7
- package/server/migrations/002_premium_features.sql +418 -418
- package/server/migrations/003_ads_integer_cents.sql +33 -33
- package/server/migrations/004_agent_os.sql +158 -158
- package/server/migrations/005_marketplace_metering.sql +126 -126
- package/server/migrations/006_growth_suite.sql +138 -0
- package/server/migrations/007_governance.sql +106 -106
- package/server/migrations/008_plans.sql +144 -144
- package/server/migrations/009_shieldqr.sql +30 -30
- package/server/migrations/010_extended_trust.sql +33 -33
- package/server/migrations/011_outreach.sql +47 -0
- package/server/migrations/012_shieldlink.sql +116 -0
- package/server/migrations/013_ct_monitor.sql +13 -0
- package/server/migrations/014_wab_advanced_features.sql +128 -0
- package/server/migrations/015_wab_truth_layer.sql +101 -0
- package/server/migrations/016_ring4_external_trust.sql +84 -0
- package/server/migrations/017_ring4_extensions.sql +69 -0
- package/server/migrations/018_commercial_foundations.sql +167 -0
- package/server/migrations/019_unify_tier_constraints.sql +133 -0
- package/server/migrations/020_agent_transaction_primitive.sql +119 -0
- package/server/models/adapters/index.js +33 -33
- package/server/models/adapters/mysql.js +183 -183
- package/server/models/adapters/postgresql.js +172 -172
- package/server/models/adapters/sqlite.js +7 -7
- package/server/models/db.js +740 -740
- package/server/observability/failure-analysis.js +337 -337
- package/server/observability/index.js +394 -394
- package/server/protocol/capabilities.js +223 -223
- package/server/protocol/index.js +243 -243
- package/server/protocol/schema.js +584 -584
- package/server/registry/certification.js +271 -271
- package/server/registry/index.js +326 -326
- package/server/routes/activate.js +478 -0
- package/server/routes/admin-outreach.js +239 -0
- package/server/routes/admin-plans.js +76 -76
- package/server/routes/admin-premium.js +674 -673
- package/server/routes/admin-shieldlink.js +137 -0
- package/server/routes/admin-shieldqr.js +90 -90
- package/server/routes/admin-trust-monitor.js +139 -83
- package/server/routes/admin.js +550 -549
- package/server/routes/adopt.js +61 -0
- package/server/routes/ads.js +130 -130
- package/server/routes/agent-workspace.js +540 -540
- package/server/routes/api-keys.js +127 -0
- package/server/routes/api.js +150 -150
- package/server/routes/auth.js +71 -71
- package/server/routes/billing.js +57 -57
- package/server/routes/commander.js +316 -316
- package/server/routes/customer-shieldlink.js +133 -0
- package/server/routes/demo-showcase.js +332 -332
- package/server/routes/demo-store.js +154 -154
- package/server/routes/diagnose.js +373 -0
- package/server/routes/discovery.js +2348 -2348
- package/server/routes/enterprise-mesh.js +170 -0
- package/server/routes/gateway.js +173 -173
- package/server/routes/governance-saas.js +203 -0
- package/server/routes/governance.js +208 -208
- package/server/routes/growth.js +1048 -0
- package/server/routes/intent.js +328 -0
- package/server/routes/license.js +251 -251
- package/server/routes/mesh.js +469 -469
- package/server/routes/noscript.js +543 -543
- package/server/routes/partners.js +201 -0
- package/server/routes/plans.js +33 -33
- package/server/routes/premium-v2.js +686 -686
- package/server/routes/premium.js +724 -724
- package/server/routes/providers.js +650 -650
- package/server/routes/reputation.js +411 -0
- package/server/routes/ring4.js +885 -0
- package/server/routes/runtime.js +2148 -2148
- package/server/routes/shieldlink.js +70 -0
- package/server/routes/shieldqr.js +88 -88
- package/server/routes/sovereign.js +465 -465
- package/server/routes/transactions.js +233 -0
- package/server/routes/truth-layer.js +670 -0
- package/server/routes/universal.js +200 -200
- package/server/routes/unsubscribe.js +51 -0
- package/server/routes/wab-api.js +850 -850
- package/server/routes/wab-cache.js +282 -0
- package/server/runtime/container-worker.js +111 -111
- package/server/runtime/container.js +448 -448
- package/server/runtime/distributed-worker.js +362 -362
- package/server/runtime/event-bus.js +210 -210
- package/server/runtime/index.js +253 -253
- package/server/runtime/queue.js +599 -599
- package/server/runtime/replay.js +666 -666
- package/server/runtime/sandbox.js +266 -266
- package/server/runtime/scheduler.js +534 -534
- package/server/runtime/session-engine.js +293 -293
- package/server/runtime/state-manager.js +188 -188
- package/server/secrets/wab-signing-key.pem +3 -0
- package/server/secrets/wab-signing-pub.pem +3 -0
- package/server/security/cross-site-redactor.js +196 -196
- package/server/security/dry-run.js +180 -180
- package/server/security/human-gate-rate-limit.js +147 -147
- package/server/security/human-gate-transports.js +178 -178
- package/server/security/human-gate.js +281 -281
- package/server/security/index.js +368 -368
- package/server/security/intent-engine.js +245 -245
- package/server/security/reward-guard.js +171 -171
- package/server/security/rollback-store.js +239 -239
- package/server/security/token-scope.js +404 -404
- package/server/security/url-policy.js +139 -139
- package/server/services/adoption-agent.js +182 -0
- package/server/services/agent-chat.js +506 -506
- package/server/services/agent-learning.js +601 -601
- package/server/services/agent-memory.js +625 -625
- package/server/services/agent-mesh.js +555 -555
- package/server/services/agent-symphony.js +717 -717
- package/server/services/agent-tasks.js +1807 -1807
- package/server/services/api-key-engine.js +292 -292
- package/server/services/cluster.js +894 -894
- package/server/services/commander.js +738 -738
- package/server/services/edge-compute.js +440 -440
- package/server/services/email.js +233 -233
- package/server/services/fairness-engine.js +409 -0
- package/server/services/fairness.js +420 -0
- package/server/services/governance.js +466 -466
- package/server/services/hosted-runtime.js +205 -205
- package/server/services/lfd.js +635 -635
- package/server/services/local-ai.js +389 -389
- package/server/services/marketplace.js +270 -270
- package/server/services/metering.js +182 -182
- package/server/services/modules/affiliate-intelligence.js +93 -93
- package/server/services/modules/agent-firewall.js +90 -90
- package/server/services/modules/bounty.js +89 -89
- package/server/services/modules/collective-bargaining.js +92 -92
- package/server/services/modules/dark-pattern.js +66 -66
- package/server/services/modules/gov-intelligence.js +45 -45
- package/server/services/modules/neural.js +55 -55
- package/server/services/modules/notary.js +49 -49
- package/server/services/modules/price-time-machine.js +86 -86
- package/server/services/modules/protocol.js +104 -104
- package/server/services/negotiation.js +439 -439
- package/server/services/outreach-agent.js +312 -0
- package/server/services/plans.js +214 -214
- package/server/services/plugins.js +771 -771
- package/server/services/price-intelligence.js +566 -566
- package/server/services/price-shield.js +1137 -1137
- package/server/services/provider-clients.js +740 -740
- package/server/services/reputation.js +465 -465
- package/server/services/search-engine.js +357 -357
- package/server/services/security.js +513 -513
- package/server/services/self-healing.js +843 -843
- package/server/services/shieldlink.js +492 -0
- package/server/services/shieldqr.js +322 -322
- package/server/services/sovereign-shield.js +542 -542
- package/server/services/ssl-ct-monitor.js +224 -0
- package/server/services/ssl-inspector.js +42 -42
- package/server/services/ssl-monitor.js +167 -167
- package/server/services/stripe.js +206 -205
- package/server/services/swarm.js +788 -788
- package/server/services/transactions.js +525 -0
- package/server/services/universal-scraper.js +662 -662
- package/server/services/verification.js +481 -481
- package/server/services/vision.js +1163 -1163
- package/server/services/wab-crypto.js +178 -178
- package/server/utils/cache.js +125 -125
- package/server/utils/migrate.js +81 -81
- package/server/utils/safe-fetch.js +228 -228
- package/server/utils/secureFields.js +50 -50
- package/server/ws.js +161 -161
- package/templates/artisan-marketplace.yaml +104 -104
- package/templates/book-price-scout.yaml +98 -98
- package/templates/electronics-price-tracker.yaml +108 -108
- package/templates/flight-deal-hunter.yaml +113 -113
- package/templates/freelancer-direct.yaml +116 -116
- package/templates/grocery-price-compare.yaml +93 -93
- package/templates/hotel-direct-booking.yaml +113 -113
- package/templates/local-services.yaml +98 -98
- package/templates/olive-oil-tunisia.yaml +88 -88
- package/templates/organic-farm-fresh.yaml +101 -101
- package/templates/restaurant-direct.yaml +97 -97
- package/templates/ring4/banking-sovereign.yaml +55 -0
- package/templates/ring4/ecommerce-sovereign.yaml +58 -0
- package/templates/ring4/healthcare-sovereign.yaml +60 -0
|
@@ -1,139 +1,139 @@
|
|
|
1
|
-
'use strict';
|
|
2
|
-
|
|
3
|
-
/**
|
|
4
|
-
* URL Policy — guards public endpoints (e.g. /api/universal/extract) that
|
|
5
|
-
* accept arbitrary user URLs. Layered on top of the SSRF guard in
|
|
6
|
-
* server/utils/safe-fetch.js, this module enforces:
|
|
7
|
-
*
|
|
8
|
-
* 1. Scheme allow-list (http and https; https only when WAB_URL_POLICY_HTTPS_ONLY=1).
|
|
9
|
-
* 2. Host denylist, matched on the exact hostname (DEFAULT_DENY_HOSTS plus WAB_URL_DENY_HOSTS).
|
|
10
|
-
* 3. Path denylist for obvious admin/credential/wp-login style targets that
|
|
11
|
-
* would suggest abuse.
|
|
12
|
-
* 4. Per-actor (IP / API-key / siteId) rate-limit independent of express
|
|
13
|
-
* router-level rate limiting.
|
|
14
|
-
*
|
|
15
|
-
* Decisions are recorded in `url_policy_audit` for review.
|
|
16
|
-
*/
|
|
17
|
-
|
|
18
|
-
const crypto = require('crypto');
|
|
19
|
-
const { db } = require('../models/db');
|
|
20
|
-
|
|
21
|
-
// Public hosts that are always refused. Local/private/metadata targets are
// already blocked by safe-fetch; these are additional public hosts that have
// no legitimate scraping use case.
const DEFAULT_DENY_HOSTS = [
  'login.microsoftonline.com',
  'accounts.google.com',
  'appleid.apple.com',
];

// Paths that look like admin panels or leaked credential/VCS files.
const DEFAULT_DENY_PATH_RE = /\/(?:wp-(?:login|admin)|administrator|phpmyadmin|\.git|\.env)(?:\/|\.|$|\?)/i;

// Length of the per-actor rate-limit window, in milliseconds.
const RATE_WINDOW_MS = 60_000;

// Limit used when WAB_URL_POLICY_RATE_MAX is unset or unusable.
const DEFAULT_RATE_MAX = 30;

/**
 * Parse the configured per-actor request limit.
 *
 * A value that does not parse to a non-negative integer (for example a typo
 * such as "3O") falls back to the default. Without this guard the limit
 * would be NaN and `count > RATE_MAX` would never be true, silently turning
 * rate limiting off.
 *
 * @param {string|undefined} raw - raw environment value
 * @returns {number} the limit to enforce per window
 */
function _parseRateMax(raw) {
  const parsed = Number.parseInt(String(raw || ''), 10);
  return Number.isInteger(parsed) && parsed >= 0 ? parsed : DEFAULT_RATE_MAX;
}

const RATE_MAX = _parseRateMax(process.env.WAB_URL_POLICY_RATE_MAX);
|
|
33
|
-
|
|
34
|
-
/**
 * Read extra denied hosts from WAB_URL_DENY_HOSTS (comma-separated).
 * Entries are trimmed and lower-cased; empty entries are dropped.
 *
 * @returns {string[]} normalized host names, possibly empty
 */
function _envHosts() {
  const raw = String(process.env.WAB_URL_DENY_HOSTS || '');
  const hosts = [];
  for (const piece of raw.split(',')) {
    const name = piece.trim().toLowerCase();
    if (name) hosts.push(name);
  }
  return hosts;
}
|
|
38
|
-
|
|
39
|
-
// Schema for the audit trail: one row per policy decision. Both statements
// are idempotent, so running them on every module load is safe.
const URL_POLICY_AUDIT_DDL = `
  CREATE TABLE IF NOT EXISTS url_policy_audit (
    id TEXT PRIMARY KEY,
    actor TEXT,
    url TEXT,
    decision TEXT NOT NULL CHECK(decision IN ('allowed','blocked','rate_limited')),
    reason TEXT,
    created_at TEXT DEFAULT (datetime('now'))
  );
  CREATE INDEX IF NOT EXISTS idx_urlpolicy_decision ON url_policy_audit(decision);
`;

db.exec(URL_POLICY_AUDIT_DDL);
|
|
50
|
-
|
|
51
|
-
// actor → timestamps (ms) of that actor's hits inside the current window
const _rate = new Map();

// Time of the last sweep that removed idle actors from `_rate`.
let _lastSweep = 0;

/**
 * Record one hit for `actor` and return how many hits that actor has made
 * within the last RATE_WINDOW_MS milliseconds (including this one).
 *
 * At most once per window the whole map is swept and actors whose newest
 * hit has aged out are deleted. Without the sweep every distinct actor
 * (typically an IP address) would stay in the map for the life of the
 * process.
 *
 * @param {string} actor - rate-limit bucket key
 * @returns {number} hits by this actor in the current window
 */
function _hit(actor) {
  const now = Date.now();

  if (now - _lastSweep >= RATE_WINDOW_MS) {
    _lastSweep = now;
    for (const [key, stamps] of _rate) {
      const newest = stamps[stamps.length - 1];
      if (newest === undefined || now - newest >= RATE_WINDOW_MS) {
        _rate.delete(key);
      }
    }
  }

  const recent = (_rate.get(actor) || []).filter((t) => now - t < RATE_WINDOW_MS);
  recent.push(now);
  _rate.set(actor, recent);
  return recent.length;
}
|
|
60
|
-
|
|
61
|
-
/**
 * Append one decision to `url_policy_audit`.
 *
 * Empty/falsy actor, url and reason are stored as NULL. Any failure while
 * writing is deliberately ignored so auditing can never block a request.
 *
 * @param {string} actor
 * @param {string} url
 * @param {string} decision - 'allowed', 'blocked' or 'rate_limited'
 * @param {string|null} [reason]
 */
function _audit(actor, url, decision, reason) {
  try {
    const insert = db.prepare(`INSERT INTO url_policy_audit (id, actor, url, decision, reason)
      VALUES (?, ?, ?, ?, ?)`);
    const row = [
      crypto.randomUUID(),
      actor || null,
      url || null,
      decision,
      reason || null,
    ];
    insert.run(...row);
  } catch (_) {
    /* never block on audit failure */
  }
}
|
|
68
|
-
|
|
69
|
-
/**
 * Evaluate a user-supplied URL against the policy and record the decision.
 *
 * Checks run in this order and the first failure decides the result:
 * presence, length (max 2048), parseability, scheme (http/https), optional
 * HTTPS-only mode (WAB_URL_POLICY_HTTPS_ONLY=1), host denylist, path
 * denylist, per-actor rate limit. Only URLs that pass every earlier check
 * count towards the rate limit.
 *
 * @param {string} rawUrl
 * @param {object} opts
 * @param {string} [opts.actor] - IP, API key id, or site id
 * @returns {{ ok:boolean, reason?:string, code?:string, parsed?:URL }}
 */
function check(rawUrl, opts = {}) {
  const actor = opts.actor || 'anon';

  if (typeof rawUrl !== 'string' || rawUrl.length === 0) {
    _audit(actor, String(rawUrl).slice(0, 200), 'blocked', 'missing_url');
    return { ok: false, reason: 'URL is required', code: 'MISSING_URL' };
  }
  if (rawUrl.length > 2048) {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'url_too_long');
    return { ok: false, reason: 'URL exceeds 2048 characters', code: 'URL_TOO_LONG' };
  }

  let parsed;
  try {
    parsed = new URL(rawUrl);
  } catch {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'invalid_url');
    return { ok: false, reason: 'Invalid URL', code: 'INVALID_URL' };
  }

  if (parsed.protocol !== 'https:' && parsed.protocol !== 'http:') {
    _audit(actor, rawUrl, 'blocked', `scheme:${parsed.protocol}`);
    return { ok: false, reason: `Scheme ${parsed.protocol} not allowed`, code: 'BAD_SCHEME' };
  }
  if (process.env.WAB_URL_POLICY_HTTPS_ONLY === '1' && parsed.protocol !== 'https:') {
    _audit(actor, rawUrl, 'blocked', 'http_disallowed');
    return { ok: false, reason: 'HTTPS required', code: 'HTTPS_REQUIRED' };
  }

  // "accounts.google.com." (fully-qualified form) names the same host as
  // "accounts.google.com"; strip trailing dots so it cannot slip past the
  // exact-match denylist.
  const host = parsed.hostname.toLowerCase().replace(/\.+$/, '');
  const deny = new Set([...DEFAULT_DENY_HOSTS, ..._envHosts()]);
  if (deny.has(host)) {
    _audit(actor, rawUrl, 'blocked', `host_denied:${host}`);
    return { ok: false, reason: `Host ${host} is denied by policy`, code: 'HOST_DENIED' };
  }

  // The URL parser keeps percent-escapes as written, so "/%2Egit/" would not
  // match the pattern even though servers decode it to "/.git/". Test the
  // decoded form as well as the raw one.
  let decodedPath = parsed.pathname;
  try {
    decodedPath = decodeURIComponent(parsed.pathname);
  } catch {
    // Malformed escape sequence: only the raw path can be tested.
  }
  if (DEFAULT_DENY_PATH_RE.test(parsed.pathname) || DEFAULT_DENY_PATH_RE.test(decodedPath)) {
    _audit(actor, rawUrl, 'blocked', `path_denied:${parsed.pathname}`);
    return { ok: false, reason: 'Path matches abuse pattern', code: 'PATH_DENIED' };
  }

  const count = _hit(actor);
  if (count > RATE_MAX) {
    _audit(actor, rawUrl, 'rate_limited', `count:${count}`);
    return { ok: false, reason: `Rate limit exceeded (${RATE_MAX} URLs/min per actor)`, code: 'RATE_LIMITED' };
  }

  _audit(actor, rawUrl, 'allowed', null);
  return { ok: true, parsed };
}
|
|
124
|
-
|
|
125
|
-
/**
 * Return the most recent audit rows, newest first.
 *
 * `limit` is coerced to a non-negative integer before it is bound. Anything
 * that does not parse, or is negative, falls back to 100: SQLite treats a
 * negative LIMIT as "no upper bound", which would dump the whole table.
 *
 * @param {number|string} [limit=100] - maximum number of rows
 * @param {string} [decision] - optional filter: 'allowed', 'blocked' or 'rate_limited'
 * @returns {object[]} rows from url_policy_audit
 */
function getRecentAudits(limit = 100, decision) {
  const requested = Number.parseInt(limit, 10);
  const rowLimit = Number.isInteger(requested) && requested >= 0 ? requested : 100;

  if (decision) {
    return db.prepare(`SELECT * FROM url_policy_audit WHERE decision = ? ORDER BY rowid DESC LIMIT ?`).all(decision, rowLimit);
  }
  return db.prepare(`SELECT * FROM url_policy_audit ORDER BY rowid DESC LIMIT ?`).all(rowLimit);
}
|
|
131
|
-
|
|
132
|
-
/**
 * Pick the rate-limit/audit identity for a request.
 *
 * Preference order: API key id (`req.wabAuth.key_id`), then user id
 * (`req.user.id`), then `req.ip`, and finally the literal 'anon'.
 *
 * @param {object} req - request object
 * @returns {*} the first truthy identity found, or 'anon'
 */
function actorFromReq(req) {
  const keyId = req.wabAuth && req.wabAuth.key_id;
  if (keyId) return keyId;

  const userId = req.user && req.user.id;
  if (userId) return userId;

  if (req.ip) return req.ip;
  return 'anon';
}
|
|
138
|
-
|
|
139
|
-
module.exports = { check, getRecentAudits, actorFromReq, RATE_MAX };
|
|
1
|
+
'use strict';
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* URL Policy — guards public endpoints (e.g. /api/universal/extract) that
|
|
5
|
+
* accept arbitrary user URLs. Layered on top of the SSRF guard in
|
|
6
|
+
* server/utils/safe-fetch.js, this module enforces:
|
|
7
|
+
*
|
|
8
|
+
* 1. Scheme allow-list (http and https; https only when WAB_URL_POLICY_HTTPS_ONLY=1).
|
|
9
|
+
* 2. Host denylist, matched on the exact hostname (DEFAULT_DENY_HOSTS plus WAB_URL_DENY_HOSTS).
|
|
10
|
+
* 3. Path denylist for obvious admin/credential/wp-login style targets that
|
|
11
|
+
* would suggest abuse.
|
|
12
|
+
* 4. Per-actor (IP / API-key / siteId) rate-limit independent of express
|
|
13
|
+
* router-level rate limiting.
|
|
14
|
+
*
|
|
15
|
+
* Decisions are recorded in `url_policy_audit` for review.
|
|
16
|
+
*/
|
|
17
|
+
|
|
18
|
+
const crypto = require('crypto');
|
|
19
|
+
const { db } = require('../models/db');
|
|
20
|
+
|
|
21
|
+
// Public hosts that are always refused. Local/private/metadata targets are
// already blocked by safe-fetch; these are additional public hosts that have
// no legitimate scraping use case.
const DEFAULT_DENY_HOSTS = [
  'login.microsoftonline.com',
  'accounts.google.com',
  'appleid.apple.com',
];

// Paths that look like admin panels or leaked credential/VCS files.
const DEFAULT_DENY_PATH_RE = /\/(?:wp-(?:login|admin)|administrator|phpmyadmin|\.git|\.env)(?:\/|\.|$|\?)/i;

// Length of the per-actor rate-limit window, in milliseconds.
const RATE_WINDOW_MS = 60_000;

// Limit used when WAB_URL_POLICY_RATE_MAX is unset or unusable.
const DEFAULT_RATE_MAX = 30;

/**
 * Parse the configured per-actor request limit.
 *
 * A value that does not parse to a non-negative integer (for example a typo
 * such as "3O") falls back to the default. Without this guard the limit
 * would be NaN and `count > RATE_MAX` would never be true, silently turning
 * rate limiting off.
 *
 * @param {string|undefined} raw - raw environment value
 * @returns {number} the limit to enforce per window
 */
function _parseRateMax(raw) {
  const parsed = Number.parseInt(String(raw || ''), 10);
  return Number.isInteger(parsed) && parsed >= 0 ? parsed : DEFAULT_RATE_MAX;
}

const RATE_MAX = _parseRateMax(process.env.WAB_URL_POLICY_RATE_MAX);
|
|
33
|
+
|
|
34
|
+
/**
 * Read extra denied hosts from WAB_URL_DENY_HOSTS (comma-separated).
 * Entries are trimmed and lower-cased; empty entries are dropped.
 *
 * @returns {string[]} normalized host names, possibly empty
 */
function _envHosts() {
  const raw = String(process.env.WAB_URL_DENY_HOSTS || '');
  const hosts = [];
  for (const piece of raw.split(',')) {
    const name = piece.trim().toLowerCase();
    if (name) hosts.push(name);
  }
  return hosts;
}
|
|
38
|
+
|
|
39
|
+
// Schema for the audit trail: one row per policy decision. Both statements
// are idempotent, so running them on every module load is safe.
const URL_POLICY_AUDIT_DDL = `
  CREATE TABLE IF NOT EXISTS url_policy_audit (
    id TEXT PRIMARY KEY,
    actor TEXT,
    url TEXT,
    decision TEXT NOT NULL CHECK(decision IN ('allowed','blocked','rate_limited')),
    reason TEXT,
    created_at TEXT DEFAULT (datetime('now'))
  );
  CREATE INDEX IF NOT EXISTS idx_urlpolicy_decision ON url_policy_audit(decision);
`;

db.exec(URL_POLICY_AUDIT_DDL);
|
|
50
|
+
|
|
51
|
+
// actor → timestamps (ms) of that actor's hits inside the current window
const _rate = new Map();

// Time of the last sweep that removed idle actors from `_rate`.
let _lastSweep = 0;

/**
 * Record one hit for `actor` and return how many hits that actor has made
 * within the last RATE_WINDOW_MS milliseconds (including this one).
 *
 * At most once per window the whole map is swept and actors whose newest
 * hit has aged out are deleted. Without the sweep every distinct actor
 * (typically an IP address) would stay in the map for the life of the
 * process.
 *
 * @param {string} actor - rate-limit bucket key
 * @returns {number} hits by this actor in the current window
 */
function _hit(actor) {
  const now = Date.now();

  if (now - _lastSweep >= RATE_WINDOW_MS) {
    _lastSweep = now;
    for (const [key, stamps] of _rate) {
      const newest = stamps[stamps.length - 1];
      if (newest === undefined || now - newest >= RATE_WINDOW_MS) {
        _rate.delete(key);
      }
    }
  }

  const recent = (_rate.get(actor) || []).filter((t) => now - t < RATE_WINDOW_MS);
  recent.push(now);
  _rate.set(actor, recent);
  return recent.length;
}
|
|
60
|
+
|
|
61
|
+
/**
 * Append one decision to `url_policy_audit`.
 *
 * Empty/falsy actor, url and reason are stored as NULL. Any failure while
 * writing is deliberately ignored so auditing can never block a request.
 *
 * @param {string} actor
 * @param {string} url
 * @param {string} decision - 'allowed', 'blocked' or 'rate_limited'
 * @param {string|null} [reason]
 */
function _audit(actor, url, decision, reason) {
  try {
    const insert = db.prepare(`INSERT INTO url_policy_audit (id, actor, url, decision, reason)
      VALUES (?, ?, ?, ?, ?)`);
    const row = [
      crypto.randomUUID(),
      actor || null,
      url || null,
      decision,
      reason || null,
    ];
    insert.run(...row);
  } catch (_) {
    /* never block on audit failure */
  }
}
|
|
68
|
+
|
|
69
|
+
/**
 * Evaluate a user-supplied URL against the policy and record the decision.
 *
 * Checks run in this order and the first failure decides the result:
 * presence, length (max 2048), parseability, scheme (http/https), optional
 * HTTPS-only mode (WAB_URL_POLICY_HTTPS_ONLY=1), host denylist, path
 * denylist, per-actor rate limit. Only URLs that pass every earlier check
 * count towards the rate limit.
 *
 * @param {string} rawUrl
 * @param {object} opts
 * @param {string} [opts.actor] - IP, API key id, or site id
 * @returns {{ ok:boolean, reason?:string, code?:string, parsed?:URL }}
 */
function check(rawUrl, opts = {}) {
  const actor = opts.actor || 'anon';

  if (typeof rawUrl !== 'string' || rawUrl.length === 0) {
    _audit(actor, String(rawUrl).slice(0, 200), 'blocked', 'missing_url');
    return { ok: false, reason: 'URL is required', code: 'MISSING_URL' };
  }
  if (rawUrl.length > 2048) {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'url_too_long');
    return { ok: false, reason: 'URL exceeds 2048 characters', code: 'URL_TOO_LONG' };
  }

  let parsed;
  try {
    parsed = new URL(rawUrl);
  } catch {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'invalid_url');
    return { ok: false, reason: 'Invalid URL', code: 'INVALID_URL' };
  }

  if (parsed.protocol !== 'https:' && parsed.protocol !== 'http:') {
    _audit(actor, rawUrl, 'blocked', `scheme:${parsed.protocol}`);
    return { ok: false, reason: `Scheme ${parsed.protocol} not allowed`, code: 'BAD_SCHEME' };
  }
  if (process.env.WAB_URL_POLICY_HTTPS_ONLY === '1' && parsed.protocol !== 'https:') {
    _audit(actor, rawUrl, 'blocked', 'http_disallowed');
    return { ok: false, reason: 'HTTPS required', code: 'HTTPS_REQUIRED' };
  }

  // "accounts.google.com." (fully-qualified form) names the same host as
  // "accounts.google.com"; strip trailing dots so it cannot slip past the
  // exact-match denylist.
  const host = parsed.hostname.toLowerCase().replace(/\.+$/, '');
  const deny = new Set([...DEFAULT_DENY_HOSTS, ..._envHosts()]);
  if (deny.has(host)) {
    _audit(actor, rawUrl, 'blocked', `host_denied:${host}`);
    return { ok: false, reason: `Host ${host} is denied by policy`, code: 'HOST_DENIED' };
  }

  // The URL parser keeps percent-escapes as written, so "/%2Egit/" would not
  // match the pattern even though servers decode it to "/.git/". Test the
  // decoded form as well as the raw one.
  let decodedPath = parsed.pathname;
  try {
    decodedPath = decodeURIComponent(parsed.pathname);
  } catch {
    // Malformed escape sequence: only the raw path can be tested.
  }
  if (DEFAULT_DENY_PATH_RE.test(parsed.pathname) || DEFAULT_DENY_PATH_RE.test(decodedPath)) {
    _audit(actor, rawUrl, 'blocked', `path_denied:${parsed.pathname}`);
    return { ok: false, reason: 'Path matches abuse pattern', code: 'PATH_DENIED' };
  }

  const count = _hit(actor);
  if (count > RATE_MAX) {
    _audit(actor, rawUrl, 'rate_limited', `count:${count}`);
    return { ok: false, reason: `Rate limit exceeded (${RATE_MAX} URLs/min per actor)`, code: 'RATE_LIMITED' };
  }

  _audit(actor, rawUrl, 'allowed', null);
  return { ok: true, parsed };
}
|
|
124
|
+
|
|
125
|
+
/**
 * Return the most recent audit rows, newest first.
 *
 * `limit` is coerced to a non-negative integer before it is bound. Anything
 * that does not parse, or is negative, falls back to 100: SQLite treats a
 * negative LIMIT as "no upper bound", which would dump the whole table.
 *
 * @param {number|string} [limit=100] - maximum number of rows
 * @param {string} [decision] - optional filter: 'allowed', 'blocked' or 'rate_limited'
 * @returns {object[]} rows from url_policy_audit
 */
function getRecentAudits(limit = 100, decision) {
  const requested = Number.parseInt(limit, 10);
  const rowLimit = Number.isInteger(requested) && requested >= 0 ? requested : 100;

  if (decision) {
    return db.prepare(`SELECT * FROM url_policy_audit WHERE decision = ? ORDER BY rowid DESC LIMIT ?`).all(decision, rowLimit);
  }
  return db.prepare(`SELECT * FROM url_policy_audit ORDER BY rowid DESC LIMIT ?`).all(rowLimit);
}
|
|
131
|
+
|
|
132
|
+
/**
 * Pick the rate-limit/audit identity for a request.
 *
 * Preference order: API key id (`req.wabAuth.key_id`), then user id
 * (`req.user.id`), then `req.ip`, and finally the literal 'anon'.
 *
 * @param {object} req - request object
 * @returns {*} the first truthy identity found, or 'anon'
 */
function actorFromReq(req) {
  const keyId = req.wabAuth && req.wabAuth.key_id;
  if (keyId) return keyId;

  const userId = req.user && req.user.id;
  if (userId) return userId;

  if (req.ip) return req.ip;
  return 'anon';
}
|
|
138
|
+
|
|
139
|
+
module.exports = { check, getRecentAudits, actorFromReq, RATE_MAX };
|
|
@@ -0,0 +1,182 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Adoption Agent — turns a bare URL into a ready-to-publish wab.json + DNS TXT.
|
|
3
|
+
*
|
|
4
|
+
* Heuristic-driven (no LLM required). Steps:
|
|
5
|
+
* 1) Run sdk/auto-discovery.discover() to extract metadata.
|
|
6
|
+
* 2) Inspect TLS fingerprint (best effort).
|
|
7
|
+
* 3) Build a draft wab.json (unsigned) from observed signals.
|
|
8
|
+
* 4) Build a draft DNS TXT record.
|
|
9
|
+
* 5) Provide deploy snippets for Cloudflare Worker, Vercel, Netlify, Next.js.
|
|
10
|
+
*
|
|
11
|
+
* Pure server-side, used by /api/adopt and bin/wab-init.js (--auto-from).
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
'use strict';
|
|
15
|
+
|
|
16
|
+
const { discover } = require('../../sdk/auto-discovery');
|
|
17
|
+
const tls = require('node:tls');
|
|
18
|
+
|
|
19
|
+
/**
 * Best-effort fetch of a host's TLS leaf-certificate SHA-256 fingerprint.
 *
 * Connects to port 443 with certificate verification disabled, so a
 * fingerprint is reported even for certificates that would not validate.
 * The promise never rejects: any error, timeout, or synchronous failure
 * from `tls.connect` resolves to `{ fp: null }`.
 *
 * @param {string} host - host name or IP literal to connect to
 * @param {number} [timeoutMs=6000] - socket inactivity timeout
 * @returns {Promise<{fp: string|null, valid_to?: string}>} lower-case hex
 *   fingerprint without colons, plus the certificate's `valid_to` on success
 */
function _tlsFingerprint(host, timeoutMs = 6000) {
  const { isIP } = require('node:net');

  return new Promise((resolve) => {
    let sock;
    let settled = false;

    // Resolve at most once and always release the socket.
    const finish = (result) => {
      if (settled) return;
      settled = true;
      if (sock) sock.destroy();
      resolve(result);
    };

    try {
      const options = { host, port: 443, rejectUnauthorized: false };
      // SNI must carry a DNS name; Node deprecates an IP address here.
      if (isIP(host) === 0) options.servername = host;

      sock = tls.connect(options, () => {
        const cert = sock.getPeerCertificate(false);
        const fp = ((cert && cert.fingerprint256) || '').replace(/:/g, '').toLowerCase();
        finish({ fp: fp || null, valid_to: cert && cert.valid_to });
      });
      sock.on('error', () => finish({ fp: null }));
      sock.setTimeout(timeoutMs, () => finish({ fp: null }));
    } catch (_) {
      // Invalid options make tls.connect throw synchronously; keep the
      // best-effort contract instead of rejecting.
      finish({ fp: null });
    }
  });
}
|
|
31
|
+
|
|
32
|
+
/**
 * Guess the site's stack from a discovery result.
 *
 * Collects which signals were observed (OpenGraph site name, schema.org
 * products, sitemap entries) and classifies the site from sitemap URLs:
 * WordPress markers first, then Next.js markers, then "ecommerce" when more
 * than five products were found; otherwise "static".
 *
 * @param {object} env - discovery result (reads `meta`, `products`, `sitemap`)
 * @returns {{type: string, signals: string[]}}
 */
function _detectStackFromEnv(env) {
  const signals = [];
  if (env.meta && env.meta.og && env.meta.og.site_name) {
    signals.push('opengraph');
  }
  if (env.products && env.products.length) {
    signals.push('schema.org/Product');
  }
  if (env.sitemap && env.sitemap.length) {
    signals.push('sitemap.xml');
  }

  // Server header probing is too slow; rely on URL/sitemap heuristics.
  const haystack = (env.sitemap || []).join(' ');

  let type = 'static';
  if (/\?p=\d+|wp-content|wp-json/i.test(haystack)) {
    type = 'wordpress';
  } else if (/\/_next\/|\/__next/.test(haystack)) {
    type = 'nextjs';
  } else if (env.products && env.products.length > 5) {
    type = 'ecommerce';
  }

  return { type, signals };
}
|
|
45
|
+
|
|
46
|
+
/**
 * Build the draft action list for a site.
 *
 * Starts with a "home" action, appends the actions found by discovery, then
 * adds synthetic actions for schema.org products, the sitemap and OpenGraph
 * metadata. Action names are unique across the whole list (the first
 * occurrence wins), entries of `env.actions` that are not objects are
 * ignored, and the result is capped at 12 actions.
 *
 * @param {object} env - discovery result (reads `actions`, `products`, `sitemap`, `meta`)
 * @param {string} baseUrl - site origin used for generated URLs
 * @returns {object[]} at most 12 action descriptors
 */
function _suggestActions(env, baseUrl) {
  const actions = [];
  const seen = new Set();

  // Append an action unless one with the same name is already listed.
  const add = (action) => {
    if (seen.has(action.name)) return;
    seen.add(action.name);
    actions.push(action);
  };

  add({ name: 'home', description: 'Open homepage', url: baseUrl });

  if (Array.isArray(env.actions)) {
    for (const discovered of env.actions) {
      // Discovery output is untrusted; skip null/primitive entries.
      if (discovered && typeof discovered === 'object') add(discovered);
    }
  }
  if (env.products && env.products.length) {
    add({ name: 'browseProducts', description: `${env.products.length} schema.org products discovered`, source: 'schema.org' });
  }
  if (env.sitemap && env.sitemap.length) {
    add({ name: 'browseSitemap', description: `${env.sitemap.length} URLs from sitemap.xml`, url: `${baseUrl}/sitemap.xml` });
  }
  if (env.meta && env.meta.og && env.meta.og.url) {
    add({ name: 'getOpenGraph', description: 'OpenGraph metadata available', source: 'opengraph' });
  }

  return actions.slice(0, 12);
}
|
|
67
|
+
|
|
68
|
+
/**
 * Build the draft `_wab` DNS TXT record for a site.
 *
 * The value always carries the version tag and the wab.json endpoint; the
 * `ssl_thumbprint` field is appended only when a fingerprint is supplied.
 *
 * @param {string} host - domain the record is created under
 * @param {string} baseUrl - site origin used to build the endpoint URL
 * @param {string|null} [fingerprint] - TLS certificate fingerprint, if known
 * @returns {{name: string, type: string, value: string}}
 */
function _dnsTxt(host, baseUrl, fingerprint) {
  const fields = ['v=wab1', `endpoint=${baseUrl}/.well-known/wab.json`];
  if (fingerprint) {
    fields.push(`ssl_thumbprint=${fingerprint}`);
  }
  return {
    name: `_wab.${host}`,
    type: 'TXT',
    value: fields.join('; '),
  };
}
|
|
73
|
+
|
|
74
|
+
/**
 * Produce copy-paste deployment instructions for the draft wab.json.
 *
 * Returns one entry per target (static hosting, Cloudflare Worker, Vercel
 * middleware, Netlify edge function, Next.js config) plus the pretty-printed
 * document itself under `inline_wab_json`. `host` is accepted for signature
 * symmetry with the other helpers but is not used.
 *
 * @param {string} host
 * @param {string} baseUrl - site origin embedded in the snippets
 * @param {object} doc - draft wab.json (reads `site` and `actions`)
 * @returns {object} snippets keyed by deployment target
 */
function _deploySnippets(host, baseUrl, doc) {
  const staticHosting = {
    title: 'Static / Apache / nginx',
    instructions: `Save the wab.json below to:\n <docroot>/.well-known/wab.json\n\nMake sure it is publicly reachable at:\n ${baseUrl}/.well-known/wab.json`
  };

  const cloudflareWorker = {
    title: '@webagentbridge/cloudflare-worker',
    install: 'npm i -g wrangler && npm i @webagentbridge/cloudflare-worker',
    env: {
      WAB_SITE_NAME: doc.site,
      WAB_SITE_URL: baseUrl,
      WAB_ACTIONS_JSON: JSON.stringify(doc.actions || [])
    },
    command: 'wrangler deploy'
  };

  const vercel = {
    title: '@webagentbridge/edge (Vercel Middleware)',
    install: 'npm i @webagentbridge/edge',
    file: 'middleware.ts',
    content: `import { handleRequest } from '@webagentbridge/edge';
export const config = { matcher: ['/.well-known/wab.json', '/.well-known/wab-discovery'] };
export default (req) => handleRequest(req, ${JSON.stringify({ siteName: doc.site, siteUrl: baseUrl, actions: doc.actions || [] }, null, 2)});`
  };

  const netlify = {
    title: '@webagentbridge/edge (Netlify Edge Function)',
    install: 'npm i @webagentbridge/edge',
    file: 'netlify/edge-functions/wab.js',
    toml: `[[edge_functions]]\nfunction = "wab"\npath = "/.well-known/wab.json"\n\n[[edge_functions]]\nfunction = "wab"\npath = "/.well-known/wab-discovery"`,
    content: `import { handleRequest } from '@webagentbridge/edge';
export default (request, ctx) => handleRequest(request, {
siteName: ${JSON.stringify(doc.site)},
siteUrl: ${JSON.stringify(baseUrl)},
actions: ${JSON.stringify(doc.actions || [])}
});`
  };

  const nextjs = {
    title: '@webagentbridge/next',
    install: 'npm i @webagentbridge/next',
    file: 'next.config.js',
    content: `const { withWAB } = require('@webagentbridge/next');
module.exports = withWAB({}, {
siteName: ${JSON.stringify(doc.site)},
siteUrl: ${JSON.stringify(baseUrl)},
actions: ${JSON.stringify(doc.actions || [], null, 2)},
});`
  };

  return {
    static: staticHosting,
    cloudflare_worker: cloudflareWorker,
    vercel,
    netlify,
    nextjs,
    inline_wab_json: JSON.stringify(doc, null, 2)
  };
}
|
|
125
|
+
|
|
126
|
+
/**
 * Suggest a complete adoption package for a URL.
 *
 * Normalizes the input to an origin, runs discovery against it, optionally
 * fetches the TLS fingerprint, and assembles a draft wab.json document with a
 * matching DNS TXT record and per-platform deployment snippets.
 *
 * @param {string} siteUrl - Site URL or bare host; `https://` is assumed when
 *   no http(s) scheme is present. Path, query and fragment are ignored.
 * @param {object} [opts]
 * @param {boolean} [opts.includeTls=true] - Pass `false` to skip the TLS fingerprint lookup.
 * @param {number} [opts.timeoutMs=8000] - Timeout forwarded to `discover`.
 * @returns {Promise<{ok:boolean, error?:string, host?:string, base_url?:string, stack?:object, ssl?:(object|null), wab_json?:object, dns_txt?:object, deploy?:object, env_summary?:object}>}
 *   `{ ok: false, error }` when the URL is missing or cannot be parsed;
 *   otherwise the full package with `ok: true`.
 */
async function suggest(siteUrl, opts = {}) {
  if (!siteUrl) return { ok: false, error: 'missing url' };
  const normalizedUrl = /^https?:\/\//i.test(siteUrl) ? siteUrl : `https://${siteUrl}`;

  let host;
  let baseUrl;
  try {
    const u = new URL(normalizedUrl);
    // The bare hostname is what the DNS record is published under.
    host = u.hostname;
    // `origin` keeps a non-default port (e.g. https://example.com:8443), so
    // discovery and every generated endpoint target the server actually given.
    baseUrl = u.origin;
  } catch {
    return { ok: false, error: 'invalid url' };
  }

  const env = await discover(baseUrl, { timeoutMs: opts.timeoutMs || 8000 });
  const stack = _detectStackFromEnv(env);
  const ssl = opts.includeTls === false ? null : await _tlsFingerprint(host);
  const fingerprint = ssl && ssl.fp;

  const doc = {
    version: '1.0',
    site: (env.site && env.site.name) || host,
    description: (env.site && env.site.description) || `${host} — generated by Adoption Agent`,
    url: baseUrl,
    project_type: stack.type,
    detected_signals: stack.signals,
    generated_at: new Date().toISOString(),
    generator: 'wab-adoption-agent',
    actions: _suggestActions(env, baseUrl),
    trust: { signed: false, note: 'Run scripts/sign-wab-domain.js to add an Ed25519 signature.' }
  };

  return {
    ok: true,
    host,
    base_url: baseUrl,
    stack,
    ssl: fingerprint ? { fingerprint_sha256: ssl.fp, valid_to: ssl.valid_to } : null,
    wab_json: doc,
    dns_txt: _dnsTxt(host, baseUrl, fingerprint),
    deploy: _deploySnippets(host, baseUrl, doc),
    env_summary: {
      source: env.source,
      action_count: doc.actions.length,
      sitemap_count: env.sitemap ? env.sitemap.length : 0,
      product_count: env.products ? env.products.length : 0,
      has_signed_wab: env.source === 'wab.json'
    }
  };
}
|
|
181
|
+
|
|
182
|
+
// Public API: only `suggest` is exported; the underscore-prefixed helpers stay module-private.
module.exports = { suggest };
|