web-agent-bridge 3.3.0 → 3.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (312) hide show
  1. package/LICENSE +84 -72
  2. package/README.ar.md +1563 -1286
  3. package/README.md +137 -1764
  4. package/bin/agent-runner.js +474 -474
  5. package/bin/cli.js +237 -237
  6. package/bin/wab-init.js +244 -0
  7. package/bin/wab.js +80 -80
  8. package/examples/azure-dns-wab.js +83 -0
  9. package/examples/bidi-agent.js +119 -119
  10. package/examples/cloudflare-wab-dns.js +121 -0
  11. package/examples/cpanel-wab-dns.js +114 -0
  12. package/examples/cross-site-agent.js +91 -91
  13. package/examples/dns-discovery-agent.js +166 -0
  14. package/examples/gcp-dns-wab.js +76 -0
  15. package/examples/governance-agent.js +169 -0
  16. package/examples/mcp-agent.js +94 -94
  17. package/examples/next-app-router/README.md +44 -44
  18. package/examples/plesk-wab-dns.js +103 -0
  19. package/examples/puppeteer-agent.js +108 -108
  20. package/examples/route53-wab-dns.js +144 -0
  21. package/examples/saas-dashboard/README.md +55 -55
  22. package/examples/safe-mode-agent.js +96 -0
  23. package/examples/self-discovery.js +106 -0
  24. package/examples/shopify-hydrogen/README.md +74 -74
  25. package/examples/vision-agent.js +171 -171
  26. package/examples/wab-sign.js +74 -0
  27. package/examples/wab-verify.js +60 -0
  28. package/examples/wordpress-elementor/README.md +77 -77
  29. package/package.json +93 -93
  30. package/public/.well-known/agent-tools.json +180 -180
  31. package/public/.well-known/ai-assets.json +59 -59
  32. package/public/.well-known/security.txt +8 -8
  33. package/public/.well-known/wab.json +28 -0
  34. package/public/activate.html +448 -0
  35. package/public/adopt.html +236 -0
  36. package/public/adoption-metrics.html +188 -0
  37. package/public/agent-workspace.html +359 -349
  38. package/public/ai.html +198 -198
  39. package/public/api.html +397 -413
  40. package/public/azure-dns-integration.html +289 -0
  41. package/public/browser.html +486 -486
  42. package/public/cloudflare-integration.html +380 -0
  43. package/public/commander-dashboard.html +243 -243
  44. package/public/cookies.html +210 -210
  45. package/public/cpanel-integration.html +398 -0
  46. package/public/css/agent-workspace.css +1713 -1713
  47. package/public/css/premium.css +317 -317
  48. package/public/css/styles.css +1401 -1235
  49. package/public/dashboard-shieldlink.html +295 -0
  50. package/public/dashboard.html +711 -706
  51. package/public/dns.html +436 -507
  52. package/public/docs.html +588 -587
  53. package/public/enterprise-mesh.ar.html +80 -0
  54. package/public/enterprise-mesh.html +81 -0
  55. package/public/feed.xml +89 -89
  56. package/public/gcp-dns-integration.html +318 -0
  57. package/public/governance.ar.html +70 -0
  58. package/public/governance.html +69 -0
  59. package/public/growth.html +465 -463
  60. package/public/index.html +1372 -1070
  61. package/public/integrations.html +556 -556
  62. package/public/js/activate.js +449 -0
  63. package/public/js/agent-workspace.js +1740 -1740
  64. package/public/js/auth-nav.js +117 -31
  65. package/public/js/auth-redirect.js +12 -12
  66. package/public/js/cookie-consent.js +56 -56
  67. package/public/js/dns.js +438 -0
  68. package/public/js/wab-demo-page.js +721 -721
  69. package/public/js/ws-client.js +74 -74
  70. package/public/l-preview.html +242 -0
  71. package/public/llms-full.txt +360 -360
  72. package/public/llms.txt +125 -125
  73. package/public/login.html +85 -85
  74. package/public/mesh-dashboard.html +328 -328
  75. package/public/milestones.html +346 -0
  76. package/public/one-click.html +779 -0
  77. package/public/openapi.json +669 -580
  78. package/public/partners.ar.html +145 -0
  79. package/public/partners.html +143 -0
  80. package/public/phone-shield.html +281 -281
  81. package/public/plesk-integration.html +375 -0
  82. package/public/premium-dashboard.html +2489 -2489
  83. package/public/premium.html +793 -793
  84. package/public/privacy.html +297 -297
  85. package/public/provider-onboarding.html +172 -0
  86. package/public/provider-sandbox.html +134 -0
  87. package/public/providers.html +359 -0
  88. package/public/refusals.html +172 -0
  89. package/public/register.html +105 -105
  90. package/public/registrar-integrations.html +141 -0
  91. package/public/ring4.html +292 -0
  92. package/public/robots.txt +99 -87
  93. package/public/route53-integration.html +531 -0
  94. package/public/score.html +263 -0
  95. package/public/script/wab-consent.d.ts +36 -36
  96. package/public/script/wab-consent.js +104 -104
  97. package/public/script/wab-schema.js +131 -131
  98. package/public/script/wab.d.ts +108 -108
  99. package/public/script/wab.min.js +580 -580
  100. package/public/security.txt +8 -8
  101. package/public/shieldlink.html +244 -0
  102. package/public/shieldqr.html +231 -0
  103. package/public/sitemap.xml +19 -1
  104. package/public/terms.html +256 -256
  105. package/public/trust-graph-api.ar.html +92 -0
  106. package/public/trust-graph-api.html +91 -0
  107. package/public/wab-features.html +560 -0
  108. package/public/wab-trust.html +200 -0
  109. package/public/wab-truth.html +375 -0
  110. package/public/wab-vs-protocols.html +210 -0
  111. package/public/whitepaper.html +449 -0
  112. package/script/ai-agent-bridge.js +1754 -1754
  113. package/sdk/README.md +99 -99
  114. package/sdk/agent-mesh.js +449 -449
  115. package/sdk/auto-discovery.js +301 -0
  116. package/sdk/commander.js +262 -262
  117. package/sdk/governance.js +262 -0
  118. package/sdk/index.d.ts +464 -464
  119. package/sdk/index.js +649 -636
  120. package/sdk/multi-agent.js +318 -318
  121. package/sdk/package.json +2 -2
  122. package/sdk/safe-mode.js +221 -0
  123. package/sdk/safety-shield.js +219 -219
  124. package/sdk/schema-discovery.js +83 -83
  125. package/server/adapters/index.js +520 -520
  126. package/server/config/plans.js +412 -367
  127. package/server/config/secrets.js +102 -102
  128. package/server/control-plane/index.js +301 -301
  129. package/server/data-plane/index.js +354 -354
  130. package/server/index.js +790 -531
  131. package/server/llm/index.js +404 -404
  132. package/server/middleware/adminAuth.js +35 -35
  133. package/server/middleware/api-tier.js +170 -0
  134. package/server/middleware/auth.js +50 -50
  135. package/server/middleware/featureGate.js +88 -88
  136. package/server/middleware/rateLimits.js +100 -100
  137. package/server/middleware/sensitiveAction.js +157 -157
  138. package/server/middleware/wab-trust.js +141 -0
  139. package/server/migrations/001_add_analytics_indexes.sql +7 -7
  140. package/server/migrations/002_premium_features.sql +418 -418
  141. package/server/migrations/003_ads_integer_cents.sql +33 -33
  142. package/server/migrations/004_agent_os.sql +158 -158
  143. package/server/migrations/005_marketplace_metering.sql +126 -126
  144. package/server/migrations/006_growth_suite.sql +138 -0
  145. package/server/migrations/007_governance.sql +106 -0
  146. package/server/migrations/008_plans.sql +144 -0
  147. package/server/migrations/009_shieldqr.sql +30 -0
  148. package/server/migrations/010_extended_trust.sql +33 -0
  149. package/server/migrations/011_outreach.sql +47 -0
  150. package/server/migrations/012_shieldlink.sql +116 -0
  151. package/server/migrations/013_ct_monitor.sql +13 -0
  152. package/server/migrations/014_wab_advanced_features.sql +128 -0
  153. package/server/migrations/015_wab_truth_layer.sql +101 -0
  154. package/server/migrations/016_ring4_external_trust.sql +84 -0
  155. package/server/migrations/017_ring4_extensions.sql +69 -0
  156. package/server/migrations/018_commercial_foundations.sql +167 -0
  157. package/server/migrations/019_unify_tier_constraints.sql +133 -0
  158. package/server/models/adapters/index.js +33 -33
  159. package/server/models/adapters/mysql.js +183 -183
  160. package/server/models/adapters/postgresql.js +172 -172
  161. package/server/models/adapters/sqlite.js +7 -7
  162. package/server/models/db.js +740 -681
  163. package/server/observability/failure-analysis.js +337 -337
  164. package/server/observability/index.js +394 -394
  165. package/server/protocol/capabilities.js +223 -223
  166. package/server/protocol/index.js +243 -243
  167. package/server/protocol/schema.js +584 -584
  168. package/server/registry/certification.js +271 -271
  169. package/server/registry/index.js +326 -326
  170. package/server/routes/activate.js +478 -0
  171. package/server/routes/admin-outreach.js +239 -0
  172. package/server/routes/admin-plans.js +76 -0
  173. package/server/routes/admin-premium.js +674 -671
  174. package/server/routes/admin-shieldlink.js +137 -0
  175. package/server/routes/admin-shieldqr.js +90 -0
  176. package/server/routes/admin-trust-monitor.js +139 -0
  177. package/server/routes/admin.js +550 -261
  178. package/server/routes/adopt.js +61 -0
  179. package/server/routes/ads.js +130 -130
  180. package/server/routes/agent-workspace.js +540 -540
  181. package/server/routes/api-keys.js +127 -0
  182. package/server/routes/api.js +150 -150
  183. package/server/routes/auth.js +71 -71
  184. package/server/routes/billing.js +57 -45
  185. package/server/routes/commander.js +316 -316
  186. package/server/routes/customer-shieldlink.js +133 -0
  187. package/server/routes/demo-showcase.js +332 -332
  188. package/server/routes/demo-store.js +154 -154
  189. package/server/routes/diagnose.js +373 -0
  190. package/server/routes/discovery.js +2348 -417
  191. package/server/routes/enterprise-mesh.js +170 -0
  192. package/server/routes/gateway.js +173 -173
  193. package/server/routes/governance-saas.js +203 -0
  194. package/server/routes/governance.js +208 -0
  195. package/server/routes/growth.js +1048 -0
  196. package/server/routes/intent.js +328 -0
  197. package/server/routes/license.js +251 -251
  198. package/server/routes/mesh.js +469 -469
  199. package/server/routes/noscript.js +543 -543
  200. package/server/routes/partners.js +201 -0
  201. package/server/routes/plans.js +33 -0
  202. package/server/routes/premium-v2.js +686 -686
  203. package/server/routes/premium.js +724 -724
  204. package/server/routes/providers.js +650 -0
  205. package/server/routes/reputation.js +411 -0
  206. package/server/routes/ring4.js +885 -0
  207. package/server/routes/runtime.js +2148 -2148
  208. package/server/routes/shieldlink.js +70 -0
  209. package/server/routes/shieldqr.js +88 -0
  210. package/server/routes/sovereign.js +465 -465
  211. package/server/routes/truth-layer.js +670 -0
  212. package/server/routes/universal.js +200 -200
  213. package/server/routes/unsubscribe.js +51 -0
  214. package/server/routes/wab-api.js +850 -850
  215. package/server/routes/wab-cache.js +282 -0
  216. package/server/runtime/container-worker.js +111 -111
  217. package/server/runtime/container.js +448 -448
  218. package/server/runtime/distributed-worker.js +362 -362
  219. package/server/runtime/event-bus.js +210 -210
  220. package/server/runtime/index.js +253 -253
  221. package/server/runtime/queue.js +599 -599
  222. package/server/runtime/replay.js +666 -666
  223. package/server/runtime/sandbox.js +266 -266
  224. package/server/runtime/scheduler.js +534 -534
  225. package/server/runtime/session-engine.js +293 -293
  226. package/server/runtime/state-manager.js +188 -188
  227. package/server/secrets/wab-signing-key.pem +3 -0
  228. package/server/secrets/wab-signing-pub.pem +3 -0
  229. package/server/security/cross-site-redactor.js +196 -196
  230. package/server/security/dry-run.js +180 -180
  231. package/server/security/human-gate-rate-limit.js +147 -147
  232. package/server/security/human-gate-transports.js +178 -178
  233. package/server/security/human-gate.js +281 -281
  234. package/server/security/index.js +368 -368
  235. package/server/security/intent-engine.js +245 -245
  236. package/server/security/reward-guard.js +171 -171
  237. package/server/security/rollback-store.js +239 -239
  238. package/server/security/token-scope.js +404 -404
  239. package/server/security/url-policy.js +139 -139
  240. package/server/services/adoption-agent.js +182 -0
  241. package/server/services/agent-chat.js +506 -506
  242. package/server/services/agent-learning.js +601 -601
  243. package/server/services/agent-memory.js +625 -625
  244. package/server/services/agent-mesh.js +555 -555
  245. package/server/services/agent-symphony.js +717 -717
  246. package/server/services/agent-tasks.js +1807 -1807
  247. package/server/services/api-key-engine.js +292 -292
  248. package/server/services/cluster.js +894 -894
  249. package/server/services/commander.js +738 -738
  250. package/server/services/edge-compute.js +440 -440
  251. package/server/services/email.js +233 -204
  252. package/server/services/fairness-engine.js +409 -0
  253. package/server/services/fairness.js +420 -0
  254. package/server/services/governance.js +466 -0
  255. package/server/services/hosted-runtime.js +205 -205
  256. package/server/services/lfd.js +635 -635
  257. package/server/services/local-ai.js +389 -389
  258. package/server/services/marketplace.js +270 -270
  259. package/server/services/metering.js +182 -182
  260. package/server/services/modules/affiliate-intelligence.js +93 -93
  261. package/server/services/modules/agent-firewall.js +90 -90
  262. package/server/services/modules/bounty.js +89 -89
  263. package/server/services/modules/collective-bargaining.js +92 -92
  264. package/server/services/modules/dark-pattern.js +66 -66
  265. package/server/services/modules/gov-intelligence.js +45 -45
  266. package/server/services/modules/neural.js +55 -55
  267. package/server/services/modules/notary.js +49 -49
  268. package/server/services/modules/price-time-machine.js +86 -86
  269. package/server/services/modules/protocol.js +104 -104
  270. package/server/services/negotiation.js +439 -439
  271. package/server/services/outreach-agent.js +312 -0
  272. package/server/services/plans.js +214 -0
  273. package/server/services/plugins.js +771 -771
  274. package/server/services/premium.js +1 -1
  275. package/server/services/price-intelligence.js +566 -566
  276. package/server/services/price-shield.js +1137 -1137
  277. package/server/services/provider-clients.js +740 -0
  278. package/server/services/reputation.js +465 -465
  279. package/server/services/search-engine.js +357 -357
  280. package/server/services/security.js +513 -513
  281. package/server/services/self-healing.js +843 -843
  282. package/server/services/shieldlink.js +492 -0
  283. package/server/services/shieldqr.js +322 -0
  284. package/server/services/sovereign-shield.js +542 -542
  285. package/server/services/ssl-ct-monitor.js +224 -0
  286. package/server/services/ssl-inspector.js +42 -0
  287. package/server/services/ssl-monitor.js +167 -0
  288. package/server/services/stripe.js +206 -192
  289. package/server/services/swarm.js +788 -788
  290. package/server/services/universal-scraper.js +662 -662
  291. package/server/services/verification.js +481 -481
  292. package/server/services/vision.js +1163 -1163
  293. package/server/services/wab-crypto.js +178 -0
  294. package/server/utils/cache.js +125 -125
  295. package/server/utils/migrate.js +81 -81
  296. package/server/utils/safe-fetch.js +228 -228
  297. package/server/utils/secureFields.js +50 -50
  298. package/server/ws.js +161 -161
  299. package/templates/artisan-marketplace.yaml +104 -104
  300. package/templates/book-price-scout.yaml +98 -98
  301. package/templates/electronics-price-tracker.yaml +108 -108
  302. package/templates/flight-deal-hunter.yaml +113 -113
  303. package/templates/freelancer-direct.yaml +116 -116
  304. package/templates/grocery-price-compare.yaml +93 -93
  305. package/templates/hotel-direct-booking.yaml +113 -113
  306. package/templates/local-services.yaml +98 -98
  307. package/templates/olive-oil-tunisia.yaml +88 -88
  308. package/templates/organic-farm-fresh.yaml +101 -101
  309. package/templates/restaurant-direct.yaml +97 -97
  310. package/templates/ring4/banking-sovereign.yaml +55 -0
  311. package/templates/ring4/ecommerce-sovereign.yaml +58 -0
  312. package/templates/ring4/healthcare-sovereign.yaml +60 -0
@@ -1,139 +1,139 @@
1
- 'use strict';
2
-
3
- /**
4
- * URL Policy — guards public endpoints (e.g. /api/universal/extract) that
5
- * accept arbitrary user URLs. Layered on top of the SSRF guard in
6
- * server/utils/safe-fetch.js, this module enforces:
7
- *
8
- * 1. Scheme allow-list (https only by default).
9
- * 2. TLD/host denylist (configurable via WAB_URL_DENY_HOSTS / DEFAULT_DENY).
10
- * 3. Path denylist for obvious admin/credential/wp-login style targets that
11
- * would suggest abuse.
12
- * 4. Per-actor (IP / API-key / siteId) rate-limit independent of express
13
- * router-level rate limiting.
14
- *
15
- * Decisions are recorded in `url_policy_audit` for review.
16
- */
17
-
18
- const crypto = require('crypto');
19
- const { db } = require('../models/db');
20
-
21
- const DEFAULT_DENY_HOSTS = [
22
- // Local/private/metadata is already blocked by safe-fetch; these are
23
- // additional public hosts that have no legitimate scraping use case.
24
- 'login.microsoftonline.com',
25
- 'accounts.google.com',
26
- 'appleid.apple.com',
27
- ];
28
-
29
- const DEFAULT_DENY_PATH_RE = /\/(?:wp-(?:login|admin)|administrator|phpmyadmin|\.git|\.env)(?:\/|\.|$|\?)/i;
30
-
31
- const RATE_WINDOW_MS = 60_000;
32
- const RATE_MAX = parseInt(process.env.WAB_URL_POLICY_RATE_MAX || '30', 10);
33
-
34
- function _envHosts() {
35
- return String(process.env.WAB_URL_DENY_HOSTS || '')
36
- .split(',').map((s) => s.trim().toLowerCase()).filter(Boolean);
37
- }
38
-
39
- db.exec(`
40
- CREATE TABLE IF NOT EXISTS url_policy_audit (
41
- id TEXT PRIMARY KEY,
42
- actor TEXT,
43
- url TEXT,
44
- decision TEXT NOT NULL CHECK(decision IN ('allowed','blocked','rate_limited')),
45
- reason TEXT,
46
- created_at TEXT DEFAULT (datetime('now'))
47
- );
48
- CREATE INDEX IF NOT EXISTS idx_urlpolicy_decision ON url_policy_audit(decision);
49
- `);
50
-
51
- const _rate = new Map(); // actor → [ts]
52
-
53
- function _hit(actor) {
54
- const now = Date.now();
55
- const arr = (_rate.get(actor) || []).filter((t) => now - t < RATE_WINDOW_MS);
56
- arr.push(now);
57
- _rate.set(actor, arr);
58
- return arr.length;
59
- }
60
-
61
- function _audit(actor, url, decision, reason) {
62
- try {
63
- db.prepare(`INSERT INTO url_policy_audit (id, actor, url, decision, reason)
64
- VALUES (?, ?, ?, ?, ?)`).run(
65
- crypto.randomUUID(), actor || null, url || null, decision, reason || null);
66
- } catch (_) { /* never block on audit failure */ }
67
- }
68
-
69
- /**
70
- * @param {string} rawUrl
71
- * @param {object} opts
72
- * @param {string} [opts.actor] - IP, API key id, or site id
73
- * @returns {{ ok:boolean, reason?:string, code?:string, parsed?:URL }}
74
- */
75
- function check(rawUrl, opts = {}) {
76
- const actor = opts.actor || 'anon';
77
-
78
- if (typeof rawUrl !== 'string' || rawUrl.length === 0) {
79
- _audit(actor, String(rawUrl).slice(0, 200), 'blocked', 'missing_url');
80
- return { ok: false, reason: 'URL is required', code: 'MISSING_URL' };
81
- }
82
- if (rawUrl.length > 2048) {
83
- _audit(actor, rawUrl.slice(0, 200), 'blocked', 'url_too_long');
84
- return { ok: false, reason: 'URL exceeds 2048 characters', code: 'URL_TOO_LONG' };
85
- }
86
-
87
- let parsed;
88
- try { parsed = new URL(rawUrl); }
89
- catch {
90
- _audit(actor, rawUrl.slice(0, 200), 'blocked', 'invalid_url');
91
- return { ok: false, reason: 'Invalid URL', code: 'INVALID_URL' };
92
- }
93
-
94
- if (parsed.protocol !== 'https:' && parsed.protocol !== 'http:') {
95
- _audit(actor, rawUrl, 'blocked', `scheme:${parsed.protocol}`);
96
- return { ok: false, reason: `Scheme ${parsed.protocol} not allowed`, code: 'BAD_SCHEME' };
97
- }
98
- if (process.env.WAB_URL_POLICY_HTTPS_ONLY === '1' && parsed.protocol !== 'https:') {
99
- _audit(actor, rawUrl, 'blocked', 'http_disallowed');
100
- return { ok: false, reason: 'HTTPS required', code: 'HTTPS_REQUIRED' };
101
- }
102
-
103
- const host = parsed.hostname.toLowerCase();
104
- const deny = new Set([...DEFAULT_DENY_HOSTS, ..._envHosts()]);
105
- if (deny.has(host)) {
106
- _audit(actor, rawUrl, 'blocked', `host_denied:${host}`);
107
- return { ok: false, reason: `Host ${host} is denied by policy`, code: 'HOST_DENIED' };
108
- }
109
-
110
- if (DEFAULT_DENY_PATH_RE.test(parsed.pathname)) {
111
- _audit(actor, rawUrl, 'blocked', `path_denied:${parsed.pathname}`);
112
- return { ok: false, reason: 'Path matches abuse pattern', code: 'PATH_DENIED' };
113
- }
114
-
115
- const count = _hit(actor);
116
- if (count > RATE_MAX) {
117
- _audit(actor, rawUrl, 'rate_limited', `count:${count}`);
118
- return { ok: false, reason: `Rate limit exceeded (${RATE_MAX} URLs/min per actor)`, code: 'RATE_LIMITED' };
119
- }
120
-
121
- _audit(actor, rawUrl, 'allowed', null);
122
- return { ok: true, parsed };
123
- }
124
-
125
- function getRecentAudits(limit = 100, decision) {
126
- if (decision) {
127
- return db.prepare(`SELECT * FROM url_policy_audit WHERE decision = ? ORDER BY rowid DESC LIMIT ?`).all(decision, limit);
128
- }
129
- return db.prepare(`SELECT * FROM url_policy_audit ORDER BY rowid DESC LIMIT ?`).all(limit);
130
- }
131
-
132
- function actorFromReq(req) {
133
- return (req.wabAuth && req.wabAuth.key_id) ||
134
- (req.user && req.user.id) ||
135
- req.ip ||
136
- 'anon';
137
- }
138
-
139
- module.exports = { check, getRecentAudits, actorFromReq, RATE_MAX };
1
+ 'use strict';
2
+
3
+ /**
4
+ * URL Policy — guards public endpoints (e.g. /api/universal/extract) that
5
+ * accept arbitrary user URLs. Layered on top of the SSRF guard in
6
+ * server/utils/safe-fetch.js, this module enforces:
7
+ *
8
+ * 1. Scheme allow-list (http and https by default; https only when WAB_URL_POLICY_HTTPS_ONLY=1).
9
+ * 2. TLD/host denylist (configurable via WAB_URL_DENY_HOSTS / DEFAULT_DENY).
10
+ * 3. Path denylist for obvious admin/credential/wp-login style targets that
11
+ * would suggest abuse.
12
+ * 4. Per-actor (IP / API-key / siteId) rate-limit independent of express
13
+ * router-level rate limiting.
14
+ *
15
+ * Decisions are recorded in `url_policy_audit` for review.
16
+ */
17
+
18
+ const crypto = require('crypto');
19
+ const { db } = require('../models/db');
20
+
21
// Public hosts that have no legitimate scraping use case. Local, private and
// metadata addresses are not listed here because safe-fetch already blocks them.
const DEFAULT_DENY_HOSTS = [
  'login.microsoftonline.com',
  'accounts.google.com',
  'appleid.apple.com',
];

// Matches a path segment naming an admin / credential style target
// (wp-login, wp-admin, administrator, phpmyadmin, .git, .env).
const DEFAULT_DENY_PATH_RE = /\/(?:wp-(?:login|admin)|administrator|phpmyadmin|\.git|\.env)(?:\/|\.|$|\?)/i;

// Length of the sliding rate-limit window, in milliseconds.
const RATE_WINDOW_MS = 60_000;

// Limit used when WAB_URL_POLICY_RATE_MAX is unset, empty or not a number.
const DEFAULT_RATE_MAX = 30;

/**
 * Parse the per-actor rate limit from its environment string.
 *
 * A non-numeric value used to yield NaN, and `count > NaN` is always false,
 * which silently switched rate limiting off. Such values now fall back to the
 * default instead.
 *
 * @param {string|undefined} raw - raw environment value
 * @returns {number} the parsed integer, or DEFAULT_RATE_MAX when unparsable
 */
function _parseRateMax(raw) {
  const parsed = parseInt(raw || String(DEFAULT_RATE_MAX), 10);
  return Number.isNaN(parsed) ? DEFAULT_RATE_MAX : parsed;
}

// Maximum URLs per actor per window; configurable via WAB_URL_POLICY_RATE_MAX.
const RATE_MAX = _parseRateMax(process.env.WAB_URL_POLICY_RATE_MAX);
33
+
34
/**
 * Read the operator-supplied host denylist from WAB_URL_DENY_HOSTS.
 *
 * The variable is a comma-separated list; each entry is trimmed and
 * lower-cased, and empty entries are discarded.
 *
 * @returns {string[]} normalised host names (empty when the variable is unset)
 */
function _envHosts() {
  const raw = String(process.env.WAB_URL_DENY_HOSTS || '');
  const hosts = [];
  for (const piece of raw.split(',')) {
    const name = piece.trim().toLowerCase();
    if (name) hosts.push(name);
  }
  return hosts;
}
38
+
39
+ db.exec(`
40
+ CREATE TABLE IF NOT EXISTS url_policy_audit (
41
+ id TEXT PRIMARY KEY,
42
+ actor TEXT,
43
+ url TEXT,
44
+ decision TEXT NOT NULL CHECK(decision IN ('allowed','blocked','rate_limited')),
45
+ reason TEXT,
46
+ created_at TEXT DEFAULT (datetime('now'))
47
+ );
48
+ CREATE INDEX IF NOT EXISTS idx_urlpolicy_decision ON url_policy_audit(decision);
49
+ `);
50
+
51
const _rate = new Map(); // actor → [ts]

// Time of the last full sweep of `_rate` (epoch ms); 0 means "never swept".
let _lastSweepAt = 0;

/**
 * Drop every actor whose most recent hit has left the rate window.
 *
 * Without this the map kept one entry per actor forever, so a stream of
 * distinct actors (e.g. client IPs) grew memory without bound.
 *
 * @param {number} now - current time in epoch milliseconds
 */
function _sweepRate(now) {
  for (const [actor, stamps] of _rate) {
    // Timestamps are appended in call order, so the last one is the newest.
    const newest = stamps[stamps.length - 1];
    if (newest === undefined || now - newest >= RATE_WINDOW_MS) _rate.delete(actor);
  }
}

/**
 * Record one hit for `actor` and return how many hits it has inside the
 * current sliding window (including this one).
 *
 * @param {string} actor - rate-limit key
 * @returns {number} hit count within the last RATE_WINDOW_MS milliseconds
 */
function _hit(actor) {
  const now = Date.now();

  // Sweep at most once per window so the cleanup cost stays amortised.
  if (now - _lastSweepAt >= RATE_WINDOW_MS) {
    _sweepRate(now);
    _lastSweepAt = now;
  }

  const arr = (_rate.get(actor) || []).filter((t) => now - t < RATE_WINDOW_MS);
  arr.push(now);
  _rate.set(actor, arr);
  return arr.length;
}
60
+
61
/**
 * Append one decision row to `url_policy_audit`.
 *
 * Empty/falsy actor, url and reason are stored as NULL. Any failure while
 * preparing or running the insert is swallowed on purpose: auditing is
 * best-effort and must not affect the policy decision.
 *
 * @param {string} actor
 * @param {string} url
 * @param {string} decision - 'allowed' | 'blocked' | 'rate_limited'
 * @param {string|null} reason
 */
function _audit(actor, url, decision, reason) {
  try {
    const insert = db.prepare(`INSERT INTO url_policy_audit (id, actor, url, decision, reason)
VALUES (?, ?, ?, ?, ?)`);
    const row = [
      crypto.randomUUID(),
      actor || null,
      url || null,
      decision,
      reason || null,
    ];
    insert.run(...row);
  } catch (_) {
    /* never block on audit failure */
  }
}
68
+
69
/**
 * Canonical form of a host name for denylist comparison: lower-cased, with
 * any trailing dots removed. `accounts.google.com.` (fully-qualified form)
 * names the same host as `accounts.google.com` and must not slip past the
 * exact-match denylist.
 *
 * @param {string} hostname
 * @returns {string}
 */
function _canonicalHost(hostname) {
  return String(hostname).toLowerCase().replace(/\.+$/, '');
}

/**
 * Test a URL path against the abuse pattern, both as written and after
 * percent-decoding, so that `/wp%2Dlogin.php` is treated like `/wp-login.php`.
 *
 * @param {string} pathname - `URL.pathname` (still percent-encoded)
 * @returns {boolean} true when the path matches DEFAULT_DENY_PATH_RE
 */
function _pathIsDenied(pathname) {
  if (DEFAULT_DENY_PATH_RE.test(pathname)) return true;
  let decoded;
  try {
    decoded = decodeURIComponent(pathname);
  } catch {
    // Malformed percent sequence: nothing more to inspect than the raw path.
    return false;
  }
  return decoded !== pathname && DEFAULT_DENY_PATH_RE.test(decoded);
}

/**
 * Decide whether a user-supplied URL may be fetched.
 *
 * Checks run in this order and stop at the first failure: presence, length
 * (max 2048), parseability, scheme (http/https, or https only when
 * WAB_URL_POLICY_HTTPS_ONLY=1), host denylist, path denylist, per-actor rate
 * limit. Every outcome is written to the audit table via _audit(). Only URLs
 * that pass all static checks count towards the rate limit.
 *
 * @param {string} rawUrl
 * @param {object} opts
 * @param {string} [opts.actor] - IP, API key id, or site id
 * @returns {{ ok:boolean, reason?:string, code?:string, parsed?:URL }}
 */
function check(rawUrl, opts = {}) {
  const actor = opts.actor || 'anon';

  if (typeof rawUrl !== 'string' || rawUrl.length === 0) {
    _audit(actor, String(rawUrl).slice(0, 200), 'blocked', 'missing_url');
    return { ok: false, reason: 'URL is required', code: 'MISSING_URL' };
  }
  if (rawUrl.length > 2048) {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'url_too_long');
    return { ok: false, reason: 'URL exceeds 2048 characters', code: 'URL_TOO_LONG' };
  }

  let parsed;
  try { parsed = new URL(rawUrl); }
  catch {
    _audit(actor, rawUrl.slice(0, 200), 'blocked', 'invalid_url');
    return { ok: false, reason: 'Invalid URL', code: 'INVALID_URL' };
  }

  if (parsed.protocol !== 'https:' && parsed.protocol !== 'http:') {
    _audit(actor, rawUrl, 'blocked', `scheme:${parsed.protocol}`);
    return { ok: false, reason: `Scheme ${parsed.protocol} not allowed`, code: 'BAD_SCHEME' };
  }
  if (process.env.WAB_URL_POLICY_HTTPS_ONLY === '1' && parsed.protocol !== 'https:') {
    _audit(actor, rawUrl, 'blocked', 'http_disallowed');
    return { ok: false, reason: 'HTTPS required', code: 'HTTPS_REQUIRED' };
  }

  // Compare canonical forms on both sides so neither a trailing dot in the
  // URL nor one in the configured list defeats the exact match.
  const host = _canonicalHost(parsed.hostname);
  const deny = new Set([...DEFAULT_DENY_HOSTS, ..._envHosts()].map(_canonicalHost));
  if (deny.has(host)) {
    _audit(actor, rawUrl, 'blocked', `host_denied:${host}`);
    return { ok: false, reason: `Host ${host} is denied by policy`, code: 'HOST_DENIED' };
  }

  if (_pathIsDenied(parsed.pathname)) {
    _audit(actor, rawUrl, 'blocked', `path_denied:${parsed.pathname}`);
    return { ok: false, reason: 'Path matches abuse pattern', code: 'PATH_DENIED' };
  }

  const count = _hit(actor);
  if (count > RATE_MAX) {
    _audit(actor, rawUrl, 'rate_limited', `count:${count}`);
    return { ok: false, reason: `Rate limit exceeded (${RATE_MAX} URLs/min per actor)`, code: 'RATE_LIMITED' };
  }

  _audit(actor, rawUrl, 'allowed', null);
  return { ok: true, parsed };
}
124
+
125
/**
 * Fetch the most recent audit rows, newest first.
 *
 * `limit` is coerced to a non-negative integer before it is bound. A negative
 * LIMIT means "no upper bound" in SQLite and would dump the whole table, and
 * a non-integer value fails at bind time, so anything that is not a finite
 * number >= 0 falls back to 100.
 *
 * @param {number} [limit=100] - maximum number of rows
 * @param {string} [decision] - when given, only rows with this decision
 * @returns {object[]} rows of `url_policy_audit`
 */
function getRecentAudits(limit = 100, decision) {
  const wanted = Math.floor(Number(limit));
  const safeLimit = Number.isFinite(wanted) && wanted >= 0 ? wanted : 100;

  if (decision) {
    return db.prepare(`SELECT * FROM url_policy_audit WHERE decision = ? ORDER BY rowid DESC LIMIT ?`).all(decision, safeLimit);
  }
  return db.prepare(`SELECT * FROM url_policy_audit ORDER BY rowid DESC LIMIT ?`).all(safeLimit);
}
131
+
132
/**
 * Pick the rate-limit / audit key for a request.
 *
 * Preference order: API key id (`req.wabAuth.key_id`), user id
 * (`req.user.id`), client address (`req.ip`), and finally the literal 'anon'.
 * A falsy value at any step falls through to the next one.
 *
 * @param {object} req - request object carrying optional wabAuth / user / ip
 * @returns {*} the first truthy identifier, or 'anon'
 */
function actorFromReq(req) {
  const keyId = req.wabAuth && req.wabAuth.key_id;
  if (keyId) return keyId;

  const userId = req.user && req.user.id;
  if (userId) return userId;

  if (req.ip) return req.ip;
  return 'anon';
}
138
+
139
+ module.exports = { check, getRecentAudits, actorFromReq, RATE_MAX };
@@ -0,0 +1,182 @@
1
+ /**
2
+ * Adoption Agent — turns a bare URL into a ready-to-publish wab.json + DNS TXT.
3
+ *
4
+ * Heuristic-driven (no LLM required). Steps:
5
+ * 1) Run sdk/auto-discovery.discover() to extract metadata.
6
+ * 2) Inspect TLS fingerprint (best effort).
7
+ * 3) Build a draft wab.json (unsigned) from observed signals.
8
+ * 4) Build a draft DNS TXT record.
9
+ * 5) Provide deploy snippets for Cloudflare Worker, Vercel, Netlify, Next.js.
10
+ *
11
+ * Pure server-side, used by /api/adopt and bin/wab-init.js (--auto-from).
12
+ */
13
+
14
+ 'use strict';
15
+
16
+ const { discover } = require('../../sdk/auto-discovery');
17
+ const tls = require('node:tls');
18
+
19
/**
 * Best-effort fetch of a server certificate's SHA-256 fingerprint.
 *
 * Opens a TLS connection, reads the peer certificate and closes the socket.
 * Certificate validation is disabled on purpose: the goal is to observe the
 * certificate the server presents, not to trust it. The promise never
 * rejects; connection errors and timeouts resolve to `{ fp: null }`.
 *
 * @param {string} host - host name to connect to (also sent as SNI)
 * @param {number} [timeoutMs=6000] - socket inactivity timeout
 * @param {number} [port=443] - TCP port of the TLS endpoint
 * @returns {Promise<{fp: string|null, valid_to?: string}>} lower-case hex
 *   fingerprint without colons, plus the certificate's `valid_to` when known
 */
function _tlsFingerprint(host, timeoutMs = 6000, port = 443) {
  return new Promise((resolve) => {
    const sock = tls.connect({ host, port, servername: host, rejectUnauthorized: false }, () => {
      const cert = sock.getPeerCertificate(false);
      sock.end();
      const fp = ((cert && cert.fingerprint256) || '').replace(/:/g, '').toLowerCase();
      resolve({ fp: fp || null, valid_to: cert && cert.valid_to });
    });
    // A promise settles only once, so a late error/timeout after success is a no-op.
    sock.on('error', () => { sock.destroy(); resolve({ fp: null }); });
    sock.setTimeout(timeoutMs, () => { sock.destroy(); resolve({ fp: null }); });
  });
}
31
+
32
/**
 * Guess the site's stack from a discovery result.
 *
 * `signals` lists which metadata sources were present (OpenGraph site name,
 * schema.org products, sitemap). `type` starts as 'static' and is refined
 * from sitemap URLs: WordPress markers win, then Next.js markers, and
 * otherwise more than five products means 'ecommerce'.
 *
 * @param {object} env - discovery result (meta / products / sitemap are optional)
 * @returns {{type: string, signals: string[]}}
 */
function _detectStackFromEnv(env) {
  const signals = [];
  const productCount = env.products ? env.products.length : 0;

  if (env.meta && env.meta.og && env.meta.og.site_name) signals.push('opengraph');
  if (productCount) signals.push('schema.org/Product');
  if (env.sitemap && env.sitemap.length) signals.push('sitemap.xml');

  // Server header probing is too slow; rely on URL/sitemap heuristics.
  const sitemapText = (env.sitemap || []).join(' ');
  let type = 'static';
  if (/\?p=\d+|wp-content|wp-json/i.test(sitemapText)) {
    type = 'wordpress';
  } else if (/\/_next\/|\/__next/.test(sitemapText)) {
    type = 'nextjs';
  } else if (productCount > 5) {
    type = 'ecommerce';
  }

  return { type, signals };
}
45
+
46
/**
 * Build the action list for the draft wab.json.
 *
 * Starts with a 'home' action, then adds actions reported by discovery, then
 * synthesized actions for products, sitemap and OpenGraph when those signals
 * exist. Action names are unique: the first action with a given name wins, so
 * a site's own `browseProducts` is not duplicated by the synthesized one.
 * Discovery entries that are not objects or have no non-empty string `name`
 * are skipped (previously a null entry threw a TypeError). At most 12 actions
 * are returned.
 *
 * @param {object} env - discovery result
 * @param {string} baseUrl - site origin, without a trailing slash
 * @returns {object[]} up to 12 action descriptors
 */
function _suggestActions(env, baseUrl) {
  const out = [];
  const seen = new Set();
  const add = (action) => {
    if (seen.has(action.name)) return;
    seen.add(action.name);
    out.push(action);
  };

  add({ name: 'home', description: 'Open homepage', url: baseUrl });

  if (Array.isArray(env.actions)) {
    for (const a of env.actions) {
      if (!a || typeof a !== 'object' || typeof a.name !== 'string' || a.name === '') continue;
      add(a);
    }
  }
  if (env.products && env.products.length) {
    add({ name: 'browseProducts', description: `${env.products.length} schema.org products discovered`, source: 'schema.org' });
  }
  if (env.sitemap && env.sitemap.length) {
    add({ name: 'browseSitemap', description: `${env.sitemap.length} URLs from sitemap.xml`, url: `${baseUrl}/sitemap.xml` });
  }
  if (env.meta && env.meta.og && env.meta.og.url) {
    add({ name: 'getOpenGraph', description: 'OpenGraph metadata available', source: 'opengraph' });
  }
  return out.slice(0, 12);
}
67
+
68
/**
 * Build the draft `_wab.<host>` DNS TXT record.
 *
 * The value is a `; `-separated list: the protocol version, the wab.json
 * endpoint under `baseUrl`, and — only when a fingerprint is supplied — the
 * certificate thumbprint.
 *
 * @param {string} host
 * @param {string} baseUrl - site origin, without a trailing slash
 * @param {string|null} [fingerprint] - certificate fingerprint, if known
 * @returns {{name: string, type: string, value: string}}
 */
function _dnsTxt(host, baseUrl, fingerprint) {
  const fields = ['v=wab1', `endpoint=${baseUrl}/.well-known/wab.json`];
  if (fingerprint) {
    fields.push(`ssl_thumbprint=${fingerprint}`);
  }
  return {
    name: `_wab.${host}`,
    type: 'TXT',
    value: fields.join('; '),
  };
}
73
+
74
/**
 * Build copy-paste deployment instructions for the generated wab.json.
 *
 * Returns one entry per target (static hosting, Cloudflare Worker, Vercel
 * middleware, Netlify edge function, Next.js config) plus the pretty-printed
 * document itself under `inline_wab_json`. Values taken from `doc` are
 * embedded with JSON.stringify so they appear as valid literals in the
 * generated snippets.
 *
 * @param {string} host - accepted for signature symmetry; not read by this function
 * @param {string} baseUrl - site origin, without a trailing slash
 * @param {object} doc - draft wab.json; `doc.site` and `doc.actions` are read
 * @returns {object} snippets keyed by deployment target
 */
function _deploySnippets(host, baseUrl, doc) {
  // Pretty-printed copy of the whole document for direct pasting.
  const docInline = JSON.stringify(doc, null, 2);
  return {
    // Plain file drop for any static host.
    static: {
      title: 'Static / Apache / nginx',
      instructions: `Save the wab.json below to:\n <docroot>/.well-known/wab.json\n\nMake sure it is publicly reachable at:\n ${baseUrl}/.well-known/wab.json`
    },
    // Worker configured through environment variables rather than code.
    cloudflare_worker: {
      title: '@webagentbridge/cloudflare-worker',
      install: 'npm i -g wrangler && npm i @webagentbridge/cloudflare-worker',
      env: {
        WAB_SITE_NAME: doc.site,
        WAB_SITE_URL: baseUrl,
        WAB_ACTIONS_JSON: JSON.stringify(doc.actions || [])
      },
      command: 'wrangler deploy'
    },
    // Middleware file that answers the two well-known paths.
    vercel: {
      title: '@webagentbridge/edge (Vercel Middleware)',
      install: 'npm i @webagentbridge/edge',
      file: 'middleware.ts',
      content: `import { handleRequest } from '@webagentbridge/edge';
export const config = { matcher: ['/.well-known/wab.json', '/.well-known/wab-discovery'] };
export default (req) => handleRequest(req, ${JSON.stringify({ siteName: doc.site, siteUrl: baseUrl, actions: doc.actions || [] }, null, 2)});`
    },
    // Edge function plus the netlify.toml routes that map both paths to it.
    netlify: {
      title: '@webagentbridge/edge (Netlify Edge Function)',
      install: 'npm i @webagentbridge/edge',
      file: 'netlify/edge-functions/wab.js',
      toml: `[[edge_functions]]\nfunction = "wab"\npath = "/.well-known/wab.json"\n\n[[edge_functions]]\nfunction = "wab"\npath = "/.well-known/wab-discovery"`,
      content: `import { handleRequest } from '@webagentbridge/edge';
export default (request, ctx) => handleRequest(request, {
siteName: ${JSON.stringify(doc.site)},
siteUrl: ${JSON.stringify(baseUrl)},
actions: ${JSON.stringify(doc.actions || [])}
});`
    },
    // next.config.js wrapper.
    nextjs: {
      title: '@webagentbridge/next',
      install: 'npm i @webagentbridge/next',
      file: 'next.config.js',
      content: `const { withWAB } = require('@webagentbridge/next');
module.exports = withWAB({}, {
siteName: ${JSON.stringify(doc.site)},
siteUrl: ${JSON.stringify(baseUrl)},
actions: ${JSON.stringify(doc.actions || [], null, 2)},
});`
    },
    inline_wab_json: docInline
  };
}
125
+
126
/**
 * Suggest a complete adoption package for a URL.
 *
 * The input may omit the scheme (https is assumed) and may carry surrounding
 * whitespace, a path or a query; only the origin is used. The origin keeps an
 * explicit non-default port, so `example.com:8443` yields
 * `https://example.com:8443` rather than silently pointing at port 443.
 *
 * Errors from `discover()` are not caught here and reject the returned promise.
 *
 * @param {string} siteUrl
 * @param {object} [opts]
 * @param {boolean} [opts.includeTls=true] - set to false to skip the TLS fingerprint probe
 * @param {number} [opts.timeoutMs=8000] - timeout handed to discovery
 * @returns {Promise<
 *   {ok:false, error:string} |
 *   {ok:true, host:string, base_url:string, stack:object, ssl:object|null,
 *    wab_json:object, dns_txt:object, deploy:object, env_summary:object}
 * >}
 */
async function suggest(siteUrl, opts = {}) {
  if (!siteUrl) return { ok: false, error: 'missing url' };

  // Work on a local copy instead of reassigning the parameter.
  let target = String(siteUrl).trim();
  if (!/^https?:\/\//i.test(target)) target = `https://${target}`;

  let host, baseUrl;
  try {
    const u = new URL(target);
    host = u.hostname;
    // `u.host` includes the port when it is not the scheme default.
    baseUrl = `${u.protocol}//${u.host}`;
  } catch {
    return { ok: false, error: 'invalid url' };
  }

  const env = await discover(baseUrl, { timeoutMs: opts.timeoutMs || 8000 });
  const stack = _detectStackFromEnv(env);
  const ssl = opts.includeTls === false ? null : await _tlsFingerprint(host);

  // Unsigned draft document assembled from the observed signals.
  const doc = {
    version: '1.0',
    site: (env.site && env.site.name) || host,
    description: (env.site && env.site.description) || `${host} — generated by Adoption Agent`,
    url: baseUrl,
    project_type: stack.type,
    detected_signals: stack.signals,
    generated_at: new Date().toISOString(),
    generator: 'wab-adoption-agent',
    actions: _suggestActions(env, baseUrl),
    trust: { signed: false, note: 'Run scripts/sign-wab-domain.js to add an Ed25519 signature.' }
  };

  return {
    ok: true,
    host,
    base_url: baseUrl,
    stack,
    ssl: ssl && ssl.fp ? { fingerprint_sha256: ssl.fp, valid_to: ssl.valid_to } : null,
    wab_json: doc,
    dns_txt: _dnsTxt(host, baseUrl, ssl && ssl.fp),
    deploy: _deploySnippets(host, baseUrl, doc),
    env_summary: {
      source: env.source,
      action_count: doc.actions.length,
      sitemap_count: env.sitemap ? env.sitemap.length : 0,
      product_count: env.products ? env.products.length : 0,
      has_signed_wab: env.source === 'wab.json'
    }
  };
}
181
+
182
+ module.exports = { suggest };