npm - @blamejs/core - Versions diffs - 0.8.42 → 0.8.49 - Mend

@blamejs/core 0.8.42 → 0.8.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (222) hide show

package/CHANGELOG.md +93 -0
package/README.md +10 -10
package/index.js +52 -0
package/lib/a2a.js +159 -34
package/lib/acme.js +762 -0
package/lib/ai-pref.js +166 -43
package/lib/api-key.js +108 -47
package/lib/api-snapshot.js +157 -40
package/lib/app-shutdown.js +113 -77
package/lib/archive.js +337 -40
package/lib/arg-parser.js +697 -0
package/lib/asyncapi.js +99 -55
package/lib/atomic-file.js +465 -104
package/lib/audit-chain.js +123 -34
package/lib/audit-daily-review.js +389 -0
package/lib/audit-sign.js +302 -56
package/lib/audit-tools.js +412 -63
package/lib/audit.js +656 -35
package/lib/auth/jwt-external.js +17 -0
package/lib/auth/oauth.js +7 -0
package/lib/auth-bot-challenge.js +505 -0
package/lib/auth-header.js +92 -25
package/lib/backup/bundle.js +26 -0
package/lib/backup/index.js +512 -89
package/lib/backup/manifest.js +168 -7
package/lib/break-glass.js +415 -39
package/lib/budr.js +103 -30
package/lib/bundler.js +86 -66
package/lib/cache.js +192 -72
package/lib/chain-writer.js +65 -40
package/lib/circuit-breaker.js +56 -33
package/lib/cli-helpers.js +106 -75
package/lib/cli.js +6 -30
package/lib/cloud-events.js +99 -32
package/lib/cluster-storage.js +162 -37
package/lib/cluster.js +340 -49
package/lib/codepoint-class.js +66 -0
package/lib/compliance.js +424 -24
package/lib/config-drift.js +111 -46
package/lib/config.js +94 -40
package/lib/consent.js +165 -18
package/lib/constants.js +1 -0
package/lib/content-credentials.js +153 -48
package/lib/cookies.js +154 -62
package/lib/credential-hash.js +133 -61
package/lib/crypto-field.js +702 -18
package/lib/crypto-hpke.js +256 -0
package/lib/crypto.js +744 -22
package/lib/csv.js +178 -35
package/lib/daemon.js +456 -0
package/lib/dark-patterns.js +186 -55
package/lib/db-query.js +79 -2
package/lib/db.js +1431 -60
package/lib/ddl-change-control.js +523 -0
package/lib/deprecate.js +195 -40
package/lib/dev.js +82 -39
package/lib/dora.js +67 -48
package/lib/dr-runbook.js +368 -0
package/lib/dsr.js +142 -11
package/lib/dual-control.js +91 -56
package/lib/events.js +120 -41
package/lib/external-db-migrate.js +192 -2
package/lib/external-db.js +795 -50
package/lib/fapi2.js +122 -1
package/lib/fda-21cfr11.js +395 -0
package/lib/fdx.js +132 -2
package/lib/file-type.js +87 -0
package/lib/file-upload.js +93 -0
package/lib/flag.js +82 -20
package/lib/forms.js +132 -29
package/lib/framework-error.js +169 -0
package/lib/framework-schema.js +163 -35
package/lib/gate-contract.js +849 -175
package/lib/graphql-federation.js +68 -7
package/lib/guard-all.js +172 -55
package/lib/guard-archive.js +286 -124
package/lib/guard-auth.js +194 -21
package/lib/guard-cidr.js +190 -28
package/lib/guard-csv.js +397 -51
package/lib/guard-domain.js +213 -91
package/lib/guard-email.js +236 -29
package/lib/guard-filename.js +307 -75
package/lib/guard-graphql.js +263 -30
package/lib/guard-html.js +310 -116
package/lib/guard-image.js +243 -30
package/lib/guard-json.js +260 -54
package/lib/guard-jsonpath.js +235 -23
package/lib/guard-jwt.js +284 -30
package/lib/guard-markdown.js +204 -22
package/lib/guard-mime.js +190 -26
package/lib/guard-oauth.js +277 -28
package/lib/guard-pdf.js +251 -27
package/lib/guard-regex.js +226 -18
package/lib/guard-shell.js +229 -26
package/lib/guard-svg.js +177 -10
package/lib/guard-template.js +232 -21
package/lib/guard-time.js +195 -29
package/lib/guard-uuid.js +189 -30
package/lib/guard-xml.js +259 -36
package/lib/guard-yaml.js +241 -44
package/lib/honeytoken.js +63 -27
package/lib/html-balance.js +83 -0
package/lib/http-client.js +486 -59
package/lib/http-message-signature.js +582 -0
package/lib/i18n.js +102 -49
package/lib/iab-mspa.js +112 -32
package/lib/iab-tcf.js +107 -2
package/lib/inbox.js +90 -52
package/lib/keychain.js +865 -0
package/lib/legal-hold.js +374 -0
package/lib/local-db-thin.js +320 -0
package/lib/log-stream.js +281 -51
package/lib/log.js +184 -86
package/lib/mail-bounce.js +107 -62
package/lib/mail.js +295 -58
package/lib/mcp.js +108 -27
package/lib/metrics.js +98 -89
package/lib/middleware/age-gate.js +36 -0
package/lib/middleware/ai-act-disclosure.js +37 -0
package/lib/middleware/api-encrypt.js +45 -0
package/lib/middleware/assetlinks.js +40 -0
package/lib/middleware/asyncapi-serve.js +35 -0
package/lib/middleware/attach-user.js +40 -0
package/lib/middleware/bearer-auth.js +40 -0
package/lib/middleware/body-parser.js +230 -0
package/lib/middleware/bot-disclose.js +34 -0
package/lib/middleware/bot-guard.js +39 -0
package/lib/middleware/compression.js +37 -0
package/lib/middleware/cookies.js +32 -0
package/lib/middleware/cors.js +40 -0
package/lib/middleware/csp-nonce.js +40 -0
package/lib/middleware/csp-report.js +34 -0
package/lib/middleware/csrf-protect.js +43 -0
package/lib/middleware/daily-byte-quota.js +53 -85
package/lib/middleware/db-role-for.js +40 -0
package/lib/middleware/dpop.js +40 -0
package/lib/middleware/error-handler.js +37 -14
package/lib/middleware/fetch-metadata.js +39 -0
package/lib/middleware/flag-context.js +34 -0
package/lib/middleware/gpc.js +33 -0
package/lib/middleware/headers.js +35 -0
package/lib/middleware/health.js +46 -0
package/lib/middleware/host-allowlist.js +30 -0
package/lib/middleware/network-allowlist.js +38 -0
package/lib/middleware/openapi-serve.js +34 -0
package/lib/middleware/rate-limit.js +160 -18
package/lib/middleware/request-id.js +36 -18
package/lib/middleware/request-log.js +37 -0
package/lib/middleware/require-aal.js +29 -0
package/lib/middleware/require-auth.js +32 -0
package/lib/middleware/require-bound-key.js +41 -0
package/lib/middleware/require-content-type.js +32 -0
package/lib/middleware/require-methods.js +27 -0
package/lib/middleware/require-mtls.js +33 -0
package/lib/middleware/require-step-up.js +37 -0
package/lib/middleware/security-headers.js +44 -0
package/lib/middleware/security-txt.js +38 -0
package/lib/middleware/span-http-server.js +37 -0
package/lib/middleware/sse.js +36 -0
package/lib/middleware/trace-log-correlation.js +33 -0
package/lib/middleware/trace-propagate.js +32 -0
package/lib/middleware/tus-upload.js +90 -0
package/lib/middleware/web-app-manifest.js +53 -0
package/lib/mtls-ca.js +100 -70
package/lib/network-byte-quota.js +308 -0
package/lib/network-heartbeat.js +135 -0
package/lib/network-tls.js +534 -4
package/lib/network.js +103 -0
package/lib/notify.js +114 -43
package/lib/ntp-check.js +192 -51
package/lib/observability.js +145 -47
package/lib/openapi.js +90 -44
package/lib/outbox.js +99 -1
package/lib/pagination.js +168 -86
package/lib/parsers/index.js +16 -5
package/lib/permissions.js +93 -40
package/lib/pqc-agent.js +84 -8
package/lib/pqc-software.js +94 -60
package/lib/process-spawn.js +95 -21
package/lib/pubsub.js +96 -66
package/lib/queue.js +375 -54
package/lib/redact.js +793 -21
package/lib/render.js +139 -47
package/lib/request-helpers.js +485 -121
package/lib/restore-bundle.js +142 -39
package/lib/restore-rollback.js +136 -45
package/lib/retention.js +178 -50
package/lib/retry.js +116 -33
package/lib/router.js +475 -23
package/lib/safe-async.js +543 -94
package/lib/safe-buffer.js +337 -41
package/lib/safe-json.js +467 -62
package/lib/safe-jsonpath.js +285 -0
package/lib/safe-schema.js +631 -87
package/lib/safe-sql.js +221 -59
package/lib/safe-url.js +278 -46
package/lib/sandbox-worker.js +135 -0
package/lib/sandbox.js +358 -0
package/lib/scheduler.js +135 -70
package/lib/self-update.js +647 -0
package/lib/session-device-binding.js +431 -0
package/lib/session.js +259 -49
package/lib/slug.js +138 -26
package/lib/ssrf-guard.js +316 -56
package/lib/storage.js +433 -70
package/lib/subject.js +405 -23
package/lib/template.js +148 -8
package/lib/tenant-quota.js +545 -0
package/lib/testing.js +440 -53
package/lib/time.js +291 -23
package/lib/tls-exporter.js +239 -0
package/lib/tracing.js +90 -74
package/lib/uuid.js +97 -22
package/lib/vault/index.js +284 -22
package/lib/vault/seal-pem-file.js +66 -0
package/lib/watcher.js +368 -0
package/lib/webhook.js +196 -63
package/lib/websocket.js +393 -68
package/lib/wiki-concepts.js +338 -0
package/lib/worker-pool.js +464 -0
package/package.json +3 -3
package/sbom.cyclonedx.json +7 -7

package/lib/safe-url.js CHANGED Viewed

@@ -1,64 +1,186 @@
 "use strict";
 /**
- * URL-safe — validate URL scheme + shape against an allowlist.
- *
- * Per the framework's modernity stance: outbound network calls
- * REQUIRE TLS by default. Operators with internal cleartext
- * endpoints (development, behind-VPN services, internal mesh) opt in
- * explicitly via opts.allowedProtocols. The framework refuses to
- * silently drop bytes on the wire as cleartext.
- *
- * Public API:
- *
- *   safeUrl.parse(url, opts?) → URL
- *     Returns a parsed URL object. Throws if the URL is malformed
- *     or its protocol is not in the allowlist.
- *
- *   opts:
- *     allowedProtocols  — array of accepted protocol strings
- *                         (e.g. ["https:"] or safeUrl.ALLOW_HTTP_TLS).
- *                         Default: ALLOW_HTTP_TLS.
- *     errorClass        — FrameworkError subclass for the thrown
- *                         error. Lets callers (object-store,
- *                         log-stream, http-client) surface their
- *                         own decorated error class. Default:
- *                         SafeUrlError.
- *     allowUserinfo     — accept URLs that carry user:pass@ credentials
- *                         in the authority. Default: false. Userinfo in
- *                         outbound URLs leaks into request logs, error
- *                         messages, metric labels, and trace spans;
- *                         credential placement belongs in headers /
- *                         cookies / a credential store, not the URL.
- *                         Operators with a legacy endpoint that
- *                         REQUIRES userinfo opt in explicitly per call.
- *
- * Constants — pre-baked allowlists for the common caller cases:
- *
- *   ALLOW_HTTP_TLS   ["https:"]                       (the secure HTTP default)
- *   ALLOW_HTTP_ALL   ["http:", "https:"]              (HTTP + cleartext opt-in)
- *   ALLOW_WS_TLS     ["wss:"]                         (the secure WS default)
- *   ALLOW_WS_ALL     ["ws:", "wss:"]                  (WS + cleartext opt-in)
- *   ALLOW_ANY        ["http:", "https:", "ws:", "wss:"]
- *
- * Why per-call constants instead of one global "secure" list:
- *   The http-client only speaks HTTP, so wss:// is a category error
- *   (operator passed a WebSocket URL to a non-WebSocket client). Each
- *   caller declares its own narrow allowlist; an off-protocol URL
- *   fails with a clear "protocol not allowed here" error rather than
- *   trying and failing weirdly later.
+ * @module b.safeUrl
+ * @nav    Validation
+ * @title  Safe Url
+ *
+ * @intro
+ *   Defensive URL parsing with a protocol allowlist (HTTPS-only by
+ *   default), authority validation, IDN-homograph defense, and a
+ *   length cap that runs BEFORE Node's WHATWG URL parser sees the
+ *   input. The framework's stance on outbound URLs: TLS-required by
+ *   default; cleartext (`http:` / `ws:`) is opt-in per call via
+ *   `opts.allowedProtocols`. `user:pass@` userinfo refuses by
+ *   default — credentials belong in headers / a credential store,
+ *   not in URL strings that leak into request logs, error messages,
+ *   metric labels, and trace spans. Mixed-script host labels
+ *   (Cyrillic 'о' inside an otherwise-Latin label, etc. — UTS #39 §5
+ *   homograph shape) refuse by default and emit
+ *   `safeurl.idn_homograph.refused` to the audit chain so a forensic
+ *   review can reconstruct every refused host.
+ *
+ *   Pre-baked protocol allowlists are exposed as frozen arrays so
+ *   each caller can declare a NARROW per-call allowlist (the
+ *   http-client speaks HTTP, not WebSocket; a `wss://` URL handed to
+ *   it is a category error that should fail loudly here, not later
+ *   inside a transport):
+ *
+ *     ALLOW_HTTP_TLS   ["https:"]                        (secure HTTP default)
+ *     ALLOW_HTTP_ALL   ["http:", "https:"]               (HTTP + cleartext opt-in)
+ *     ALLOW_WS_TLS     ["wss:"]                          (secure WS default)
+ *     ALLOW_WS_ALL     ["ws:", "wss:"]                   (WS + cleartext opt-in)
+ *     ALLOW_ANY        ["http:", "https:", "ws:", "wss:"]
+ *
+ *   `parse` throws `SafeUrlError` (or a caller-supplied error class
+ *   via `opts.errorClass`, used by `b.objectStore` / `b.logStream` /
+ *   `b.httpClient` to surface their own decorated error type) with a
+ *   stable `.code`: `safe-url/missing` / `safe-url/too-long` /
+ *   `safe-url/malformed` / `safe-url/protocol-disallowed` /
+ *   `safe-url/userinfo-disallowed` / `safe-url/idn-homograph` /
+ *   `safe-url/bad-opt`. Operator code that wants a boolean
+ *   parse-without-throw shape wraps the throw in a try / catch.
+ *
+ * @card
+ *   Defensive URL parsing with a protocol allowlist (HTTPS-only by default), authority validation, IDN-homograph defense, and a length cap that runs BEFORE Node's WHATWG URL parser sees the input.
  */
 var C = require("./constants");
+var codepointClass = require("./codepoint-class");
+var lazyRequire = require("./lazy-require");
 var numericBounds = require("./numeric-bounds");
 var { FrameworkError } = require("./framework-error");
+var nodeUrl = require("url");
 var { URL } = require("url");
+var audit = lazyRequire(function () { return require("./audit"); });
+/**
+ * @primitive b.safeUrl.ALLOW_HTTP_TLS
+ * @signature b.safeUrl.ALLOW_HTTP_TLS
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse, b.safeUrl.ALLOW_HTTP_ALL
+ *
+ * Frozen protocol allowlist for HTTPS-only HTTP traffic — `["https:"]`.
+ * The framework default for any outbound URL parsed without an
+ * explicit `opts.allowedProtocols`. Operators with a legitimate
+ * cleartext use case opt in per call via `ALLOW_HTTP_ALL`.
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   b.safeUrl.ALLOW_HTTP_TLS;
+ *   // → ["https:"]
+ */
 var ALLOW_HTTP_TLS = Object.freeze(["https:"]);
+/**
+ * @primitive b.safeUrl.ALLOW_HTTP_ALL
+ * @signature b.safeUrl.ALLOW_HTTP_ALL
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse, b.safeUrl.ALLOW_HTTP_TLS
+ *
+ * Frozen protocol allowlist accepting both HTTP and HTTPS —
+ * `["http:", "https:"]`. Pass to `parse` when the call site
+ * legitimately speaks cleartext (loopback admin endpoints, on-prem
+ * service mesh terminating TLS at a sidecar, legacy partner APIs).
+ * Never the framework default — TLS-required is.
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   var u = b.safeUrl.parse("http://127.0.0.1:8080/health", {
+ *     allowedProtocols: b.safeUrl.ALLOW_HTTP_ALL,
+ *   });
+ *   u.protocol;
+ *   // → "http:"
+ */
 var ALLOW_HTTP_ALL = Object.freeze(["http:", "https:"]);
+/**
+ * @primitive b.safeUrl.ALLOW_WS_TLS
+ * @signature b.safeUrl.ALLOW_WS_TLS
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse, b.safeUrl.ALLOW_WS_ALL
+ *
+ * Frozen protocol allowlist for secure WebSocket traffic — `["wss:"]`.
+ * The framework default for any WebSocket URL parsed without an
+ * explicit `opts.allowedProtocols`.
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   b.safeUrl.ALLOW_WS_TLS;
+ *   // → ["wss:"]
+ */
 var ALLOW_WS_TLS   = Object.freeze(["wss:"]);
+/**
+ * @primitive b.safeUrl.ALLOW_WS_ALL
+ * @signature b.safeUrl.ALLOW_WS_ALL
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse, b.safeUrl.ALLOW_WS_TLS
+ *
+ * Frozen protocol allowlist accepting both `ws:` and `wss:` —
+ * `["ws:", "wss:"]`. Opt-in per call when cleartext WebSocket is
+ * acceptable (loopback dev, sidecar-terminated TLS).
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   var u = b.safeUrl.parse("ws://127.0.0.1:9000/stream", {
+ *     allowedProtocols: b.safeUrl.ALLOW_WS_ALL,
+ *   });
+ *   u.protocol;
+ *   // → "ws:"
+ */
 var ALLOW_WS_ALL   = Object.freeze(["ws:", "wss:"]);
+/**
+ * @primitive b.safeUrl.ALLOW_ANY
+ * @signature b.safeUrl.ALLOW_ANY
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse, b.safeUrl.ALLOW_HTTP_TLS
+ *
+ * Frozen allowlist accepting every framework-supported scheme —
+ * `["http:", "https:", "ws:", "wss:"]`. Suited to a generic
+ * URL-validation surface where the caller already enforces the
+ * protocol downstream; narrower allowlists are preferred wherever
+ * possible.
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   b.safeUrl.ALLOW_ANY.length;
+ *   // → 4
+ */
 var ALLOW_ANY      = Object.freeze(["http:", "https:", "ws:", "wss:"]);
+/**
+ * @primitive b.safeUrl.SafeUrlError
+ * @signature b.safeUrl.SafeUrlError
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.parse
+ *
+ * Error class thrown by `parse` (or by the caller-supplied
+ * `opts.errorClass`, used by `b.objectStore` / `b.logStream` /
+ * `b.httpClient` to surface a decorated operational error type).
+ * Extends `FrameworkError`. Carries a stable `.code`:
+ * `safe-url/missing` / `safe-url/too-long` / `safe-url/malformed` /
+ * `safe-url/protocol-disallowed` / `safe-url/userinfo-disallowed` /
+ * `safe-url/idn-homograph` / `safe-url/bad-opt`. HTTP middleware
+ * inspects `.code` to translate the throw into a 400 without
+ * leaking parser internals.
+ *
+ * @example
+ *   var b = require("blamejs");
+ *   try {
+ *     b.safeUrl.parse("ftp://example.com/file.txt");
+ *   } catch (e) {
+ *     e instanceof b.safeUrl.SafeUrlError;   // → true
+ *     e.code;                                // → "safe-url/protocol-disallowed"
+ *   }
+ */
 class SafeUrlError extends FrameworkError {
   constructor(code, message) {
     super(message, code);
@@ -83,6 +205,71 @@ function _makeError(errorClass, code, message) {
 // payloads) override via opts.maxUrlLength.
 var DEFAULT_MAX_URL_LENGTH = C.BYTES.kib(8);
+/**
+ * @primitive b.safeUrl.parse
+ * @signature b.safeUrl.parse(url, opts?)
+ * @since     0.1.0
+ * @status    stable
+ * @related   b.safeUrl.SafeUrlError, b.safeUrl.ALLOW_HTTP_TLS, b.safeUrl.ALLOW_HTTP_ALL
+ *
+ * Parse a URL string (or an existing `URL` instance) through the
+ * framework's defensive gates: length cap BEFORE Node's WHATWG parser
+ * sees the input (RFC 7230 §3.1.1 — 8 KiB default), protocol
+ * allowlist (`https:` only by default), `user:pass@` userinfo refusal
+ * (credentials leak into request logs / error messages / metric
+ * labels / trace spans), and per-label IDN-homograph defense
+ * (UTS #39 §5 mixed-script — Cyrillic 'о' inside an otherwise-Latin
+ * label). Returns the parsed `URL` instance on success.
+ *
+ * Throws `SafeUrlError` (or the caller-supplied `opts.errorClass`)
+ * with one of the documented `.code` strings: `safe-url/missing` /
+ * `safe-url/too-long` / `safe-url/malformed` /
+ * `safe-url/protocol-disallowed` / `safe-url/userinfo-disallowed` /
+ * `safe-url/idn-homograph` / `safe-url/bad-opt`. Operator code that
+ * wants a boolean parse-without-throw shape wraps the call in a
+ * `try` / `catch`.
+ *
+ * @opts
+ *   allowedProtocols: string[],   // default ALLOW_HTTP_TLS (["https:"])
+ *   maxUrlLength:     number,     // default 8192 (RFC 7230 §3.1.1)
+ *   allowUserinfo:    boolean,    // default false; opt-in to user:pass@
+ *   allowMixedScript: boolean,    // default false; opt-in to mixed-script labels
+ *   allowedScripts:   string[],   // narrow mixed-script allowlist (e.g. ["latin","cyrillic"])
+ *   errorClass:       Function,   // throw this instead of SafeUrlError (used by b.httpClient / b.objectStore)
+ *
+ * @example
+ *   var b = require("blamejs");
+ *
+ *   // Default: HTTPS-only, length cap, userinfo refused, IDN-homograph defended.
+ *   var u = b.safeUrl.parse("https://example.com/path?q=1");
+ *   u.hostname;
+ *   // → "example.com"
+ *
+ *   // Cleartext is opt-in per call via the ALLOW_HTTP_ALL preset.
+ *   var http = b.safeUrl.parse("http://127.0.0.1:8080/health", {
+ *     allowedProtocols: b.safeUrl.ALLOW_HTTP_ALL,
+ *   });
+ *   http.protocol;
+ *   // → "http:"
+ *
+ *   // Disallowed protocol throws SafeUrlError.
+ *   try { b.safeUrl.parse("javascript:alert(1)"); }
+ *   catch (e) { e.code; }
+ *   // → "safe-url/protocol-disallowed"
+ *
+ *   // Userinfo refused by default — credentials belong in headers.
+ *   try { b.safeUrl.parse("https://alice:s3cr3t@example.com/"); }
+ *   catch (e) { e.code; }
+ *   // → "safe-url/userinfo-disallowed"
+ *
+ *   // Boolean parse-without-throw shape via try/catch wrapper.
+ *   function isValid(s) {
+ *     try { b.safeUrl.parse(s); return true; }
+ *     catch (_e) { return false; }
+ *   }
+ *   isValid("https://example.com/");   // → true
+ *   isValid("ftp://example.com/");     // → false
+ */
 function parse(url, opts) {
   opts = opts || {};
   var allowed = Array.isArray(opts.allowedProtocols) && opts.allowedProtocols.length > 0
@@ -145,6 +332,51 @@ function parse(url, opts) {
       "reads at call time), or pass opts.allowUserinfo: true to opt this URL in.");
   }
+  // IDN homograph defense — each host label MUST be single-script
+  // (UTS #39 §5). A label that mixes Cyrillic + Latin (e.g. `gооgle.com`
+  // with Cyrillic 'о' inside the otherwise-Latin label) presents
+  // visually as a trusted host while resolving via DNS to attacker-
+  // controlled infrastructure. Defaults to refuse; operators with
+  // legitimate mixed-script host labels opt in via `allowMixedScript: true`,
+  // which skips this check entirely. Every refusal audits with the host
+  // so a forensic review can reconstruct which hosts were rejected.
+  // Detection is per-label (not whole-host): each label is checked on its
+  // own, so a host whose labels are individually single-script (e.g. a
+  // Cyrillic label under a Latin TLD) is not refused here. Node's URL
+  // parser normalizes IDN hosts to Punycode (`xn--`), so we decode each
+  // label to Unicode first via nodeUrl.domainToUnicode and run the
+  // mixed-script catalog on the decoded codepoints.
+  if (opts.allowMixedScript !== true && parsed.hostname) {
+    var unicodeHost;
+    try { unicodeHost = nodeUrl.domainToUnicode(parsed.hostname); }
+    catch (_e) { unicodeHost = parsed.hostname; }
+    var labels = (unicodeHost || parsed.hostname).split(".");
+    var allowedScripts = Array.isArray(opts.allowedScripts) ? opts.allowedScripts : null;
+    for (var li = 0; li < labels.length; li += 1) {
+      var label = labels[li];
+      if (label.length === 0) continue;
+      var mixed = codepointClass.detectMixedScripts(label, allowedScripts);
+      if (mixed) {
+        try {
+          audit().safeEmit({
+            action:  "safeurl.idn_homograph.refused",
+            outcome: "denied",
+            metadata: {
+              host:    parsed.hostname,
+              label:   label,
+              scripts: mixed,
+            },
+          });
+        } catch (_e) { /* audit best-effort */ }
+        throw _makeError(errClass, "safe-url/idn-homograph",
+          "URL host label '" + label + "' mixes scripts (" + mixed.join(", ") +
+          ") — IDN homograph attack shape (UTS #39 §5). Refuses by default; " +
+          "operators with a legitimate mixed-script host pass " +
+          "opts.allowMixedScript: true (with an audited reason) or " +
+          "opts.allowedScripts: ['latin','cyrillic'] to allowlist specific scripts.");
+      }
+    }
+  }
   return parsed;
 }

package/lib/sandbox-worker.js ADDED Viewed

@@ -0,0 +1,135 @@
+"use strict";
+/**
+ * sandbox-worker — bootstrap module loaded inside the worker_threads
+ * Worker spawned by lib/sandbox.js. Runs UNTRUSTED operator-supplied
+ * source against a pre-stripped global scope.
+ *
+ * NOT operator-facing — operators interact via b.sandbox.run().
+ *
+ * Wire format:
+ *   workerData: {
+ *     source:          string,    // operator-supplied JS — function body
+ *     input:           any,       // pass-through input
+ *     allowedGlobals:  string[],  // intersected with KNOWN_SAFE_BUILTINS
+ *     maxResultBytes:  number,    // hard-cap on JSON.stringify(result)
+ *   }
+ *
+ * Posts back via parentPort:
+ *   { ok: true,  resultJson, runtimeMs, peakBytes }
+ *   { ok: false, code, message, runtimeMs, peakBytes }
+ *
+ * Containment summary:
+ *   - process / Buffer / setTimeout / setInterval / setImmediate (plus
+ *     their clear* counterparts) / queueMicrotask / global are deleted
+ *     off globalThis before the operator code is compiled, unless named
+ *     in allowedGlobals; require is always deleted.
+ *   - The operator source is compiled via the JS language's
+ *     string-to-callable primitive — the compiled function's outer
+ *     scope is GLOBAL (stripped) and CANNOT see the bootstrap's
+ *     own locals (require, workerThreads, parentPort).
+ *   - Resource limits (maxOldGenerationSizeMb / maxYoungGenerationSizeMb /
+ *     codeRangeSizeMb / stackSizeMb) are set by the host on Worker
+ *     construction; v8 kills the worker on heap overflow.
+ *   - Output is JSON-serialized; the worker refuses any result whose
+ *     stringified form exceeds maxResultBytes.
+ */
+var workerThreads = require("node:worker_threads");
+(function () {
+  var data = workerThreads.workerData || {};
+  var allowed = Array.isArray(data.allowedGlobals) ? data.allowedGlobals : [];
+  var maxResultBytes = (typeof data.maxResultBytes === "number") ? data.maxResultBytes : null;
+  var ALWAYS_AVAILABLE = [
+    "Object", "Array", "String", "Number", "Boolean", "Symbol",
+    "Promise", "Error", "TypeError", "RangeError", "RegExp",
+  ];
+  var keep = Object.create(null);
+  for (var i = 0; i < ALWAYS_AVAILABLE.length; i += 1) keep[ALWAYS_AVAILABLE[i]] = true;
+  for (var j = 0; j < allowed.length; j += 1) keep[allowed[j]] = true;
+  var NODE_BUILTINS = [
+    "process", "Buffer",
+    "setImmediate", "clearImmediate",
+    "setTimeout", "clearTimeout",
+    "setInterval", "clearInterval",
+    "queueMicrotask",
+    "global",
+  ];
+  for (var k = 0; k < NODE_BUILTINS.length; k += 1) {
+    var nm = NODE_BUILTINS[k];
+    if (!keep[nm]) {
+      try { delete globalThis[nm]; }
+      catch (_e1) { try { globalThis[nm] = undefined; } catch (_e2) { /* best-effort */ } }
+    }
+  }
+  try { delete globalThis.require; } catch (_e) { /* best-effort */ }
+  var startedAt = Date.now();
+  var peakBytes = 0;
+  function snapshotPeak() {
+    try {
+      var proc = (typeof process !== "undefined") ? process : null;
+      if (proc && typeof proc.memoryUsage === "function") {
+        var u = proc.memoryUsage();
+        if (u && typeof u.heapUsed === "number" && u.heapUsed > peakBytes) peakBytes = u.heapUsed;
+      }
+    } catch (_e) { /* process gone or stripped */ }
+  }
+  snapshotPeak();
+  // Compile operator source via the JS language's string-to-callable
+  // primitive. The compiled function's outer scope is GLOBAL (already
+  // stripped above); it cannot see this bootstrap's own locals.
+  var Compiler = (function () { return Function; }());
+  var fn;
+  try {
+    fn = new Compiler("input", data.source);
+  } catch (eParse) {
+    workerThreads.parentPort.postMessage({
+      ok: false, code: "sandbox/parse-error",
+      message: "sandbox source did not parse: " + (eParse && eParse.message),
+      runtimeMs: Date.now() - startedAt, peakBytes: peakBytes,
+    });
+    return;
+  }
+  try {
+    var result = fn(data.input);
+    snapshotPeak();
+    var runtimeMs = Date.now() - startedAt;
+    var serialized;
+    try { serialized = (result === undefined) ? undefined : JSON.stringify(result); }
+    catch (eSer) {
+      workerThreads.parentPort.postMessage({
+        ok: false, code: "sandbox/result-not-serializable",
+        message: "sandbox result is not JSON-serializable: " + (eSer && eSer.message),
+        runtimeMs: runtimeMs, peakBytes: peakBytes,
+      });
+      return;
+    }
+    if (maxResultBytes !== null && serialized && serialized.length > maxResultBytes) {
+      workerThreads.parentPort.postMessage({
+        ok: false, code: "sandbox/oversized-result",
+        message: "sandbox result exceeded maxResultBytes (" + serialized.length + " > " + maxResultBytes + ")",
+        runtimeMs: runtimeMs, peakBytes: peakBytes,
+      });
+      return;
+    }
+    workerThreads.parentPort.postMessage({
+      ok: true, resultJson: serialized, runtimeMs: runtimeMs, peakBytes: peakBytes,
+    });
+  } catch (eRun) {
+    snapshotPeak();
+    workerThreads.parentPort.postMessage({
+      ok: false, code: "sandbox/runtime-error",
+      message: "sandbox transform threw: " + (eRun && eRun.message ? eRun.message : String(eRun)),
+      runtimeMs: Date.now() - startedAt, peakBytes: peakBytes,
+    });
+  }
+}());