npm - @trusty-squire/mcp - Versions diffs - 0.6.14-rc.2 → 0.6.14-rc.21 - Mend

@trusty-squire/mcp 0.6.14-rc.2 → 0.6.14-rc.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (72) hide show

package/LICENSE +21 -0
package/dist/api-client.d.ts +45 -0
package/dist/api-client.d.ts.map +1 -1
package/dist/api-client.js +43 -0
package/dist/api-client.js.map +1 -1
package/dist/bin.js +12 -0
package/dist/bin.js.map +1 -1
package/dist/bot/agent.d.ts +35 -2
package/dist/bot/agent.d.ts.map +1 -1
package/dist/bot/agent.js +525 -38
package/dist/bot/agent.js.map +1 -1
package/dist/bot/browser.d.ts +8 -0
package/dist/bot/browser.d.ts.map +1 -1
package/dist/bot/browser.js +193 -20
package/dist/bot/browser.js.map +1 -1
package/dist/bot/index.d.ts +4 -2
package/dist/bot/index.d.ts.map +1 -1
package/dist/bot/index.js +17 -3
package/dist/bot/index.js.map +1 -1
package/dist/bot/llm-client.d.ts +1 -1
package/dist/bot/llm-client.d.ts.map +1 -1
package/dist/bot/onboarding-capture.d.ts +3 -0
package/dist/bot/onboarding-capture.d.ts.map +1 -1
package/dist/bot/onboarding-capture.js +70 -5
package/dist/bot/onboarding-capture.js.map +1 -1
package/dist/bot/promote-to-skill.d.ts +2 -1
package/dist/bot/promote-to-skill.d.ts.map +1 -1
package/dist/bot/promote-to-skill.js +214 -29
package/dist/bot/promote-to-skill.js.map +1 -1
package/dist/bot/replay-skill.d.ts +4 -0
package/dist/bot/replay-skill.d.ts.map +1 -1
package/dist/bot/replay-skill.js +300 -3
package/dist/bot/replay-skill.js.map +1 -1
package/dist/install/cli.d.ts +16 -0
package/dist/install/cli.d.ts.map +1 -1
package/dist/install/cli.js +63 -6
package/dist/install/cli.js.map +1 -1
package/dist/server.d.ts.map +1 -1
package/dist/server.js +1 -0
package/dist/server.js.map +1 -1
package/dist/session.d.ts.map +1 -1
package/dist/session.js +15 -5
package/dist/session.js.map +1 -1
package/dist/skill-cli/cli.d.ts +25 -0
package/dist/skill-cli/cli.d.ts.map +1 -1
package/dist/skill-cli/cli.js +558 -13
package/dist/skill-cli/cli.js.map +1 -1
package/dist/skill-cli/registry-http.d.ts +1 -0
package/dist/skill-cli/registry-http.d.ts.map +1 -1
package/dist/skill-cli/registry-http.js +3 -0
package/dist/skill-cli/registry-http.js.map +1 -1
package/dist/skill-cli/signing.d.ts +21 -0
package/dist/skill-cli/signing.d.ts.map +1 -0
package/dist/skill-cli/signing.js +71 -0
package/dist/skill-cli/signing.js.map +1 -0
package/dist/skill-registry-client.d.ts +2 -0
package/dist/skill-registry-client.d.ts.map +1 -1
package/dist/skill-registry-client.js +83 -36
package/dist/skill-registry-client.js.map +1 -1
package/dist/tools/extract-failures.d.ts +23 -0
package/dist/tools/extract-failures.d.ts.map +1 -0
package/dist/tools/extract-failures.js +108 -0
package/dist/tools/extract-failures.js.map +1 -0
package/dist/tools/index.d.ts +2 -1
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +6 -1
package/dist/tools/index.js.map +1 -1
package/dist/tools/provision-any.d.ts +7 -0
package/dist/tools/provision-any.d.ts.map +1 -1
package/dist/tools/provision-any.js +346 -45
package/dist/tools/provision-any.js.map +1 -1
package/package.json +16 -15

package/dist/bot/agent.js CHANGED Viewed

@@ -15,6 +15,7 @@ import { saveDebugSnapshot } from "./debug.js";
 import { captureOnboardingRound } from "./onboarding-capture.js";
 import { wasRecentlyPrewarmed, recordPrewarmSuccess } from "./prewarm-cache.js";
 import { pickLLMPair, } from "./llm-client.js";
+import { getDomain } from "tldts";
 // Hard cap on LLM calls per signup. A signup that runs away to 20+ calls
 // is both expensive and almost certainly stuck in a planning loop. 15
 // covers: 2 initial form plans, 1 re-plan pair on validation, plus 6
@@ -131,6 +132,17 @@ export function guessSignupUrl(service) {
     const host = entry ?? `${slug}.com`;
     return `https://${host}/signup`;
 }
+// BUG-2 GUARD — did `url` come from KNOWN_DOMAINS as a hardcoded full
+// URL (vs the default /signup convention)? These were explicitly
+// chosen because the default 404s and the real entry is non-obvious
+// — e.g. Railway's /login, Cloudflare's dash.cloudflare.com/sign-up.
+// Trust the mapping rather than falling back to a Google search.
+// Exported for unit testing.
+export function isKnownDomainFullUrlMatch(service, url) {
+    const slug = service.toLowerCase().replace(/[^a-z0-9]/g, "");
+    const entry = KNOWN_DOMAINS[slug];
+    return entry !== undefined && /^https?:\/\//i.test(entry) && entry === url;
+}
 // True when the URL is a Google search results page — used to gate
 // the prewarm + the post-load "did we land somewhere useful?" check.
 export function isGoogleSearchUrl(url) {
@@ -314,6 +326,39 @@ export function formatInventory(inventory) {
                 ? `value="" (EMPTY — fill before submitting)`
                 : `value=${JSON.stringify(e.value.slice(0, 60))}`);
         }
+        // <select> state. `value=""` is the React-defaulted-placeholder
+        // pattern (the first option's value is empty, common for
+        // "No workspace" / "Select…" / "Choose…" prompts). React Hook
+        // Form treats those fields as untouched and silently rejects
+        // submits — Railway's token-creation form was the canonical
+        // case. The planner needs the selected text and the option
+        // list to issue an explicit `select` step before clicking
+        // submit. Selectors run to end-of-line, so this annotation goes
+        // BEFORE the trailing `selector=`.
+        //
+        // rc.17: suppress the DEFAULTED marker for selects we've already
+        // selected (data-ts-touched). A successful selectOption to a
+        // value="" option leaves value=="" but the form-state is
+        // committed — without this suppression the planner would see
+        // DEFAULTED again next round and re-select indefinitely.
+        if (e.tag === "select") {
+            const selectedText = e.selectedOptionText ?? "";
+            const isDefaulted = e.value !== null && e.value !== undefined && e.value.length === 0;
+            const alreadyTouched = e.interactedThisRun === true;
+            bits.push(isDefaulted && !alreadyTouched
+                ? `value="" selected=${JSON.stringify(selectedText)} (DEFAULTED — pick an explicit option before submitting)`
+                : `value=${JSON.stringify((e.value ?? "").slice(0, 60))} selected=${JSON.stringify(selectedText)}${alreadyTouched ? " (touched — already selected by bot)" : ""}`);
+            if (e.selectOptions !== null && e.selectOptions !== undefined && e.selectOptions.length > 0) {
+                const optionTexts = e.selectOptions
+                    .map((o) => o.text || `(value=${JSON.stringify(o.value)})`)
+                    .filter((t) => t.length > 0)
+                    .slice(0, 6)
+                    .map((t) => JSON.stringify(t))
+                    .join(", ");
+                if (optionTexts.length > 0)
+                    bits.push(`options=[${optionTexts}]`);
+            }
+        }
         const label = e.labelText ?? e.ariaLabel;
         if (label !== null && label !== undefined) {
             bits.push(`label=${JSON.stringify(label)}`);
@@ -331,6 +376,120 @@ export function formatInventory(inventory) {
     })
         .join("\n");
 }
+// Platform-as-a-service customer-tenant suffixes that the bundled PSL
+// in `tldts` does NOT (yet) classify as public suffixes, but functionally
+// behave like one: every label to the left is a distinct customer site,
+// not an extension of the platform's own brand.
+//
+// Without this override, `getDomain("storysite-production.up.railway.app")`
+// returns `"railway.app"` (first label "railway") and the guard wrongly
+// matches it to slug "railway" — which is exactly the Railway bug this
+// guard is meant to prevent.
+//
+// Keep this list short: only platforms where serving arbitrary 3rd-party
+// content on `*.<suffix>` is the platform's primary purpose. Custom-domain-
+// only platforms (e.g. heroku custom domains) don't belong here.
+//
+// Order matters — most-specific first. We pick the longest suffix the
+// hostname ends with.
+const PLATFORM_TENANT_SUFFIXES = [
+    "up.railway.app",
+    "railway.app",
+    "vercel.app",
+    "netlify.app",
+    "pages.dev",
+    "fly.dev",
+    "onrender.com",
+    "herokuapp.com",
+    "github.io",
+    "gitlab.io",
+    "workers.dev",
+];
+// Treat `hostname` as if `suffix` were a public suffix: return the label
+// immediately to the left of the suffix, lowercased. Returns null if the
+// hostname doesn't end with the suffix.
+function tenantLabelUnderPlatformSuffix(hostname, suffix) {
+    const lc = hostname.toLowerCase();
+    const dotSuffix = `.${suffix}`;
+    if (!lc.endsWith(dotSuffix))
+        return null;
+    const head = lc.slice(0, -dotSuffix.length);
+    if (head.length === 0)
+        return null;
+    // The tenant label is the LAST label of head (rightmost-before-suffix).
+    const parts = head.split(".");
+    return parts[parts.length - 1] ?? null;
+}
+// BUG-1 GUARD — does `hostname` belong to the same registered domain as
+// `serviceSlug` (the alphanumeric squashed service name like "railway",
+// "postmark")?
+//
+// Uses PSL-aware eTLD+1 (via tldts) AND a hardcoded override for
+// platform-tenant suffixes the bundled PSL doesn't cover yet, so platform
+// subdomains like `*.up.railway.app` and `*.vercel.app` are correctly
+// classified as distinct customer sites.
+//
+//   railway.com                          ↔ slug "railway" → MATCH
+//   docs.railway.com                     ↔ slug "railway" → MATCH
+//   storysite-production.up.railway.app  ↔ slug "railway" → REJECT
+//                                          (matched by platform override —
+//                                          tenant label is "storysite-production",
+//                                          not "railway")
+//   railway.app                          ↔ slug "railway" → MATCH
+//                                          (the apex itself is the platform's
+//                                          own brand; only labels to the left
+//                                          are tenant sites)
+//   railway.io (typosquat)               ↔ slug "railway" → MATCH
+//                                          (intentional — we can't disambiguate
+//                                          typosquats from TLD variants like
+//                                          sentry.com vs sentry.io)
+//
+// Empty slug → permissive (return true), preserving prior behavior when
+// no service name was provided to findSignupLink.
+//
+// Exported for unit testing.
+export function hostMatchesServiceDomain(hostname, serviceSlug) {
+    if (serviceSlug.length === 0)
+        return true;
+    const lcHost = hostname.toLowerCase();
+    // Platform-tenant override: if hostname is `*.<platform-suffix>`, the
+    // tenant label (left of the suffix) is the "site name", not the
+    // platform's brand. Pick the LONGEST matching suffix so e.g.
+    // "x.up.railway.app" picks "up.railway.app" before "railway.app".
+    let bestSuffix = null;
+    for (const sfx of PLATFORM_TENANT_SUFFIXES) {
+        if (lcHost.endsWith(`.${sfx}`) &&
+            (bestSuffix === null || sfx.length > bestSuffix.length)) {
+            bestSuffix = sfx;
+        }
+    }
+    if (bestSuffix !== null) {
+        const tenant = tenantLabelUnderPlatformSuffix(lcHost, bestSuffix);
+        if (tenant === null)
+            return false;
+        const normalizedTenant = tenant.replace(/[^a-z0-9]/g, "");
+        return normalizedTenant === serviceSlug;
+    }
+    const registered = getDomain(lcHost);
+    if (registered === null)
+        return false;
+    // The first label of the eTLD+1 is the "site name". For railway.com
+    // that's "railway".
+    const firstLabel = registered.split(".")[0]?.toLowerCase() ?? "";
+    // Normalize: strip hyphens so "trusty-squire" matches slug "trustysquire".
+    const normalized = firstLabel.replace(/[^a-z0-9]/g, "");
+    return normalized === serviceSlug;
+}
+// BUG-3 GUARD — diagnostic flag for the Inventory snapshot. Stricter
+// than detectAntiBotBlock (no "cf-turnstile" / "recaptcha" raw-HTML
+// matches) because the previous regex false-positive matched legitimate
+// signup pages that just embed a Turnstile/reCAPTCHA widget script.
+// Match on visible-text patterns only.
+//
+// Exported for unit testing.
+export function isAntiBotInterstitialText(visibleText) {
+    return /just a moment|verify you are human|attention required|are you a robot|checking your browser/i.test(visibleText);
+}
 // Recognize a full-page anti-bot interstitial that's still up. Returns
 // the vendor name (for the status message) or null. Pattern matching
 // on visible text rather than markers — most vendors use the same UX
@@ -351,24 +510,80 @@ export function detectAntiBotBlock(html) {
         return "Imperva";
     return null;
 }
-// F17 — True when the inventory looks like an authenticated
-// dashboard rather than a sign-up page. Triggers when a prior OAuth
-// bind already linked the account and the service auto-redirects
-// past the sign-in widget on the next visit. Detection signals:
-//   - At least one element whose visible text matches an
-//     authenticated-state keyword (Sign out / Log out / Dashboard /
-//     Projects / Settings / Profile / Account)
-//   - No email/password input fields visible (a true sign-up page
-//     virtually always has at least one)
-// Conservative — both conditions must hold.
-export function detectAlreadySignedIn(inventory) {
-    const AUTH_KEYWORDS = /^\s*(?:sign out|log out|dashboard|projects|settings|profile|my account|account settings|workspaces)\s*$/i;
-    const hasAuthMarker = inventory.some((e) => AUTH_KEYWORDS.test((e.visibleText ?? e.ariaLabel ?? "").trim()));
-    if (!hasAuthMarker)
-        return false;
+// F17 — True when the page looks like an authenticated dashboard
+// rather than a sign-up page. Triggers when a prior OAuth bind
+// already linked the account and the service auto-redirects past
+// the sign-in widget on the next visit.
+//
+// **Universal precondition**: no email/password/tel input visible.
+// A true sign-up page virtually always has at least one; if any
+// such input is present, we are NOT authenticated regardless of
+// what other markers the page carries.
+//
+// **Positive signals (any one fires authentication)**:
+//   1. Explicit nav keyword (Sign out / Log out / Dashboard /
+//      Projects / Settings / Profile / Account / Workspaces) —
+//      the canonical strict-match path. Works for Sentry,
+//      OpenRouter, Postmark, etc. — sites with a real nav bar.
+//   2. Billing / trial widget visible ("$X.XX left", "N days left",
+//      "Trial") — these only render to authenticated users. Caught
+//      Railway's `/new` page where the only post-login marker was
+//      the "28 days or $5.00 leftTrial" button.
+//   3. Dashboard-route URL (path contains /new, /dashboard,
+//      /projects, /account, /settings, /workspace) AND a creation
+//      CTA visible ("New project", "Create", "New <X>") — paired
+//      signal that catches sparse SPAs whose entire layout is a
+//      single create-form on a logged-in URL.
+//
+// rc.18: signals 2 and 3 added. Previously only signal 1 was
+// checked; Railway's project-creation widget tripped the form-fill
+// fallback (and a low-confidence LLM plan that filled "Empty
+// Project" then waited for a verification email that never came).
+export function detectAlreadySignedIn(args) {
+    const { inventory, url } = args;
+    // Precondition: any visible credential input → not authenticated.
     const hasCredentialInput = inventory.some((e) => e.tag === "input" &&
         (e.type === "email" || e.type === "password" || e.type === "tel"));
-    return !hasCredentialInput;
+    if (hasCredentialInput)
+        return false;
+    const visibleTextOf = (e) => `${e.visibleText ?? ""} ${e.ariaLabel ?? ""}`.trim();
+    // Signal 1 — strict nav-keyword match (the canonical Sentry-class case).
+    const AUTH_KEYWORDS = /^\s*(?:sign out|log out|dashboard|projects|settings|profile|my account|account settings|workspaces)\s*$/i;
+    if (inventory.some((e) => AUTH_KEYWORDS.test((e.visibleText ?? e.ariaLabel ?? "").trim()))) {
+        return true;
+    }
+    // Signal 2 — billing / trial widget. Patterns observed in the wild:
+    //   "28 days or $5.00 leftTrial" (Railway, no separator)
+    //   "Trial" (most SaaS)
+    //   "$N left" / "N days left" / "remaining"
+    const BILLING = /(?:\$\d+(?:\.\d+)?\s*(?:left|remaining)|\d+\s*days?\s*(?:left|remaining|trial)|\btrial\b)/i;
+    if (inventory.some((e) => BILLING.test(visibleTextOf(e)))) {
+        return true;
+    }
+    // Signal 3 — dashboard-route URL + creation CTA visible.
+    // The URL gate is conservative: a path that READS as dashboard,
+    // not /login or /signup or /. Combined with a creation CTA
+    // ("New project", "Create workspace", "+ New") it pins the
+    // page as a post-login surface.
+    let dashboardyPath = false;
+    try {
+        const parsed = new URL(url);
+        dashboardyPath =
+            /\/(?:new|dashboard|projects?|account|settings|workspace|home)(?:\/|$)/i.test(parsed.pathname) && !/\/(?:signup|sign-up|register|login|sign-in|signin)/i.test(parsed.pathname);
+    }
+    catch {
+        // Malformed URL — skip URL signal.
+    }
+    if (dashboardyPath) {
+        const CREATION_CTA = /^\s*(?:\+\s*)?(?:new\s+(?:project|workspace|team|app|site|deployment|api\s*key)|create(?:\s+(?:new|a|project|workspace))?)/i;
+        if (inventory.some((e) => {
+            const t = e.visibleText ?? e.ariaLabel ?? "";
+            return CREATION_CTA.test(t.trim());
+        })) {
+            return true;
+        }
+    }
+    return false;
 }
 // True when the page has no fillable text input AND no button that
 // reads as an email-signup option — a genuinely OAuth/SSO-only
@@ -844,8 +1059,13 @@ export class SignupAgent {
                 steps.push(`Dismissed cookie consent: "${dismissed}"`);
             }
             await saveDebugSnapshot(this.browser, "before-fill");
-            const state = await this.browser.getState();
-            const inventory = await this.buildInventory(steps, oauthCandidates);
+            // PERF: getState() (page.content + title + screenshot) and
+            // extractInteractiveElements (DOM walk) are independent
+            // Playwright calls — fire them in parallel.
+            const [state, inventory] = await Promise.all([
+                this.browser.getState(),
+                this.buildInventory(steps, oauthCandidates),
+            ]);
             // OAuth-first (T6/T13 + auto-prefer): when the page carries a
             // "Sign in with <provider>" affordance for a provider the bot can
             // use, that button unconditionally outranks any form field — hand
@@ -883,8 +1103,8 @@ export class SignupAgent {
                 // path entirely and route to the post-OAuth navigation loop
                 // to find the API key — same path Sentry/OpenRouter use post-
                 // handshake.
-                if (detectAlreadySignedIn(inventory)) {
-                    steps.push("Auto-OAuth: page shows dashboard markers (Sign out / Dashboard / etc.) — " +
+                if (detectAlreadySignedIn({ inventory, url: state.url })) {
+                    steps.push("Auto-OAuth: page shows authenticated-state markers (nav keyword, billing widget, or dashboard URL + create CTA) — " +
                         "treating as already authenticated, jumping to post-verify navigation");
                     return { kind: "already_oauth" };
                 }
@@ -1029,7 +1249,10 @@ export class SignupAgent {
                 steps.push(`⚠ submit click failed: ${reason}`);
                 return { kind: "submit_failed", reason };
             }
-            await this.browser.wait(5);
+            // PERF: 5s was overcautious — runCaptchaGate has its own wait
+            // for the captcha widget to render, and waitForFormReady at
+            // the next planner iteration handles SPA settle.
+            await this.browser.wait(2);
             const postGate = await this.runCaptchaGate("Post-submit", steps);
             if (postGate.blocked)
                 return { kind: "captcha_blocked", captchaKind: postGate.kind };
@@ -1089,7 +1312,11 @@ export class SignupAgent {
                     .replace(/\s+/g, " ")
                     .trim()
                     .slice(0, 240);
-                const antiBot = /just a moment|verify you are human|attention required|cloudflare|cf-challenge|cf-turnstile|recaptcha|are you a robot/i.test(state.html);
+                // BUG-3 FIX: match on user-visible text only. Previous regex
+                // hit `cf-turnstile` / `recaptcha` / `cloudflare` in raw HTML,
+                // false-positive-firing on legitimate signup pages that embed
+                // a Turnstile widget script.
+                const antiBot = isAntiBotInterstitialText(text);
                 steps.push(`Inventory diagnostic: title=${JSON.stringify(state.title.slice(0, 80))} ` +
                     `url=${state.url.slice(0, 120)} text=${JSON.stringify(text)}` +
                     (antiBot ? " ⚠ anti-bot interstitial detected" : ""));
@@ -1177,7 +1404,20 @@ export class SignupAgent {
         }
         return misses.length > 0 ? misses.join(", ") : null;
     }
-    constructor(browser, llm) {
+    // Diagnostic uploader — best-effort. When set, the post-verify
+    // loop uploads the current DOM + screenshot to the registry-api
+    // after a failed extract pass, so UI-shape regressions can be
+    // diagnosed without users needing to configure debug env vars.
+    // Wired from the MCP layer; undefined in unit-test contexts.
+    extractFailureUploader;
+    // Per-round telemetry uploader (0.6.14-rc.11). Fires on every post-
+    // verify round so the registry has the full DOM + screenshot trail
+    // for any stuck signup, not just the ones that fail at extract.
+    roundUploader;
+    // Set per-task in signup(). Lets the uploader know which service
+    // was being provisioned without threading it through every call.
+    currentService = "";
+    constructor(browser, llm, opts = {}) {
         this.browser = browser;
         if (llm === undefined) {
             this.llmPair = pickLLMPair({ preferCheap: PREFER_CHEAP_LLM });
@@ -1192,6 +1432,12 @@ export class SignupAgent {
             // case. Tests and the MCP-Sampling future path use this.
             this.llmPair = { primary: llm, premium: null };
         }
+        if (opts.extractFailureUploader !== undefined) {
+            this.extractFailureUploader = opts.extractFailureUploader;
+        }
+        if (opts.roundUploader !== undefined) {
+            this.roundUploader = opts.roundUploader;
+        }
     }
     // Read-only view of how many calls landed on which backend. Exported
     // through SignupResult.llm_backends so tests and ops can verify the
@@ -1303,6 +1549,10 @@ export class SignupAgent {
         // (Google number-match etc.). Without it, the run still works —
         // steps are just only visible in the final result.
         const steps = task.stepsSink ?? [];
+        // Stash the service name so the diagnostic uploader (called from
+        // deep inside postVerifyLoop after a failed extract) can label
+        // the snapshot without us threading task through every method.
+        this.currentService = task.service;
         const rawTimeout = Number(process.env.UNIVERSAL_BOT_RUN_TIMEOUT_MS);
         const timeoutMs = Number.isFinite(rawTimeout) && rawTimeout > 0 ? rawTimeout : 600_000;
         let timer;
@@ -1378,18 +1628,32 @@ export class SignupAgent {
             }
             steps.push(`Navigating to ${signupUrl}`);
             await this.browser.goto(signupUrl);
-            await this.browser.wait(2);
+            // PERF: goto() awaits domcontentloaded; the subsequent
+            // waitForFormReady in planExecuteWithRetry handles SPA settle.
+            // No need for a blind 2s dwell here.
             // When we *guessed* (no signup_url provided) and the page after
             // load doesn't look like a signup page — no inputs, no OAuth
             // affordance, or an obvious 404/error title — fall back to the
             // search-and-find-link path. This is the safety net that lets
             // the bot recover from a wrong canonical guess (e.g. a service
             // that uses /register or a non-`.com` TLD).
-            if (task.signupUrl === undefined && !(await this.looksLikeSignupPage())) {
+            //
+            // BUG-2 GUARD: when the guessed URL came from KNOWN_DOMAINS as a
+            // full hardcoded URL (e.g. Railway → https://railway.com/login,
+            // Cloudflare → https://dash.cloudflare.com/sign-up), trust the
+            // mapping. These were explicitly chosen because the default
+            // /signup path 404s and the real entry is non-obvious — falling
+            // back to a Google search has produced cross-domain bugs (the
+            // Railway run that ended up on storysite-production.up.railway.app).
+            const usedKnownFullUrl = isKnownDomainFullUrlMatch(task.service, guessed);
+            if (task.signupUrl === undefined &&
+                !usedKnownFullUrl &&
+                !(await this.looksLikeSignupPage())) {
                 steps.push(`${guessed} didn't look like a signup page — searching for the real one`);
                 const fallbackSearch = `https://www.google.com/search?q=${encodeURIComponent(`${task.service} signup`)}`;
                 await this.browser.goto(fallbackSearch);
-                await this.browser.wait(2);
+                // PERF: domcontentloaded from goto() + findSignupLink reads
+                // the DOM itself — no blind dwell needed.
                 signupUrl = fallbackSearch;
             }
             if (signupUrl !== guessed || isGoogleSearchUrl(signupUrl)) {
@@ -1401,7 +1665,26 @@ export class SignupAgent {
                     await this.runPrewarm(found, steps);
                     steps.push(`Found signup link: ${found}`);
                     await this.browser.goto(found);
-                    await this.browser.wait(2);
+                    // PERF: planner loop's waitForFormReady is next; no dwell.
+                }
+                else {
+                    // BUG-1 GUARD: findSignupLink filters off-domain candidates
+                    // (registered-domain match against the service slug). If
+                    // nothing remained AND we'd been sent here from a Google
+                    // fallback, the bot is sitting on a SERP with no usable
+                    // destination — abort rather than let the form-fill planner
+                    // happily fill the Google search box.
+                    if (isGoogleSearchUrl(signupUrl)) {
+                        return {
+                            success: false,
+                            error: `no_signup_link: searched for ${task.service}'s signup page and ` +
+                                `found no on-domain candidates. The service likely doesn't have ` +
+                                `a public self-serve signup, or the bot's domain guard rejected ` +
+                                `every match. Sign up manually.`,
+                            steps,
+                            ...this.resultTail(),
+                        };
+                    }
                 }
             }
             // Steps 2-5: plan the form, fill it, submit — via the
@@ -1543,7 +1826,10 @@ export class SignupAgent {
                             if (verifyLink !== null) {
                                 steps.push(`Following verification link: ${verifyLink}`);
                                 await this.browser.goto(verifyLink);
-                                await this.browser.wait(3);
+                                // PERF: a 1s settle is enough for the verify landing
+                                // page to commit cookies + render the post-verify
+                                // dashboard. Previous 3s was over-cautious.
+                                await this.browser.wait(1);
                                 await saveDebugSnapshot(this.browser, "after-verify");
                                 // Try extracting first — many services drop the API key
                                 // straight onto the landing page after verification.
@@ -1924,7 +2210,7 @@ Output rules:
   7-15 char handle.`;
         const hintLine = input.hint !== undefined ? `\nHint: ${input.hint}` : "";
         const userBlocks = [
-            { kind: "image", media_type: "image/png", data_base64: input.screenshot },
+            { kind: "image", media_type: "image/jpeg", data_base64: input.screenshot },
             {
                 kind: "text",
                 text: `Service: ${input.service}
@@ -2046,8 +2332,11 @@ ${formatInventory(input.inventory)}`,
             let state;
             let inventory;
             try {
-                state = await this.browser.getState();
-                inventory = await this.buildInventory(args.steps, undefined, 80);
+                // PERF: parallel getState + inventory (independent calls).
+                [state, inventory] = await Promise.all([
+                    this.browser.getState(),
+                    this.buildInventory(args.steps, undefined, 80),
+                ]);
             }
             catch (err) {
                 args.steps.push(`Post-verify round ${round}: page was mid-navigation ` +
@@ -2090,10 +2379,12 @@ ${formatInventory(input.inventory)}`,
                 continue;
             }
             args.steps.push(`Post-verify ${round + 1}/${args.maxRounds}: ${nextStep.kind} — ${nextStep.reason}`);
-            // Dev-only (env-gated): dump this round's real page state +
-            // inventory into the E1 eval-corpus format, so onboarding
-            // adapters can be iterated offline without re-running the
-            // rate-limited OAuth handshake.
+            // Dump this round's real page state + inventory in the E1
+            // eval-corpus format so onboarding adapters can be iterated
+            // offline without re-running the rate-limited OAuth handshake.
+            // Default-on as of 0.6.14-rc.11 — writes to
+            // ~/.trusty-squire/corpus/onboarding/ unless an env override
+            // points elsewhere or disables it.
             captureOnboardingRound({
                 service: args.service,
                 round,
@@ -2102,6 +2393,34 @@ ${formatInventory(input.inventory)}`,
                 inventory,
                 observed: nextStep,
             });
+            // Per-round telemetry upload (rc.11). Mirrors the disk capture
+            // but ships to the registry so debugging works from any host —
+            // the bot may be running in Goose or a sibling agent that
+            // doesn't share a filesystem with whoever's diagnosing the run.
+            // Fire-and-forget; failures must never abort the loop.
+            if (this.roundUploader !== undefined) {
+                const observedReason = "reason" in nextStep ? nextStep.reason : "";
+                void (async () => {
+                    try {
+                        await this.roundUploader({
+                            service: args.service,
+                            round,
+                            kind: nextStep.kind,
+                            url: state.url,
+                            title: state.title,
+                            inventory_count: inventory.length,
+                            observed_reason: observedReason,
+                            html: state.html,
+                            ...(state.screenshot !== undefined && state.screenshot.length > 0
+                                ? { screenshot_jpeg_base64: state.screenshot }
+                                : {}),
+                        });
+                    }
+                    catch {
+                        // best-effort — telemetry upload is diagnostic, never load-bearing
+                    }
+                })();
+            }
             // Stuck-loop detector. Re-planning steps (done/extract/login/
             // wait/navigate) are exempt: extract is its own progress signal,
             // navigate intentionally changes the URL not the current DOM,
@@ -2141,6 +2460,40 @@ ${formatInventory(input.inventory)}`,
                     const emptyInputHint = emptyInputs.length > 0
                         ? `\n\nVisible empty inputs on this page (any of these is a likely required field):\n${emptyInputs.join("\n")}\n\nIssue {"kind":"fill"} on one of them with a sensible value.`
                         : "";
+                    // Defaulted <select>s — value="" means the first <option>
+                    // (typically "Select…", "No workspace", "Choose…") is still
+                    // showing. React Hook Form treats those as untouched and
+                    // silently rejects submits. The Railway token-create form
+                    // was the canonical case: the Workspace dropdown's "No
+                    // workspace" placeholder was visually selected, but its
+                    // value="" left React state undefined, so Create did
+                    // nothing. Surface them explicitly so the planner emits a
+                    // select step before another click.
+                    const defaultedSelects = inventory
+                        .filter((e) => e.tag === "select" &&
+                        e.value !== null &&
+                        e.value !== undefined &&
+                        e.value.length === 0 &&
+                        e.selectOptions !== null &&
+                        e.selectOptions !== undefined &&
+                        e.selectOptions.length > 1 &&
+                        // rc.17 — skip selects we've already touched; their
+                        // form state is committed even though the visible
+                        // value="" still trips the DEFAULTED heuristic.
+                        e.interactedThisRun !== true)
+                        .slice(0, 5)
+                        .map((e) => {
+                        const label = e.labelText ?? e.ariaLabel ?? e.name ?? e.placeholder ?? "(no label)";
+                        // Show the first non-empty-value option as the suggested
+                        // pick — the obvious target when the planner doesn't
+                        // have a domain reason to prefer a specific one.
+                        const realOptions = (e.selectOptions ?? []).filter((o) => o.value.length > 0 && o.text.length > 0);
+                        const firstReal = realOptions[0]?.text ?? "(none)";
+                        return `  - ${JSON.stringify(label)} → selector=${e.selector} (first real option: ${JSON.stringify(firstReal)})`;
+                    });
+                    const defaultedSelectHint = defaultedSelects.length > 0
+                        ? `\n\nVisible DEFAULTED dropdowns on this page (value="" — React form-state likely treats these as UNTOUCHED, which silently fails submit):\n${defaultedSelects.join("\n")}\n\nIssue {"kind":"select", "option_text":"…"} to commit a choice. Even if the default visible label ("No workspace", "None") is what you want, you MUST emit the select step to register it with the form's state.`
+                        : "";
                     args.steps.push(sameSelector
                         ? `Post-verify: no-progress detected — same ${nextStep.kind} on same selector, inventory unchanged. Re-planning instead of re-running.`
                         : `Post-verify: no-progress detected — successive click steps with no inventory change. Forcing a non-click action.`);
@@ -2152,7 +2505,8 @@ ${formatInventory(input.inventory)}`,
                             `DIFFERENT KIND: {"kind":"fill"} on any empty text input, {"kind":"check"} on ` +
                             `any unticked checkbox, {"kind":"select"} on any unselected dropdown, or ` +
                             `{"kind":"done"} if there is genuinely nothing to do.` +
-                            emptyInputHint;
+                            emptyInputHint +
+                            defaultedSelectHint;
                     prevSignature = signature;
                     prevInventorySize = inventory.length;
                     continue;
@@ -2175,6 +2529,33 @@ ${formatInventory(input.inventory)}`,
                     credentials = await this.extractCredentials();
                     if (credentials.api_key === undefined) {
                         consecutiveFailedExtracts += 1;
+                        // Best-effort diagnostic upload: when extract returns
+                        // null despite the planner asserting a credential is
+                        // visible, capture the DOM + screenshot so the UI shape
+                        // can be inspected later. Wrapped tight — any failure
+                        // here MUST NOT abort the post-verify loop.
+                        if (this.extractFailureUploader !== undefined) {
+                            void (async () => {
+                                try {
+                                    const snapshot = await this.browser.getState();
+                                    const candidates = await this.browser.extractCredentialCandidates();
+                                    await this.extractFailureUploader({
+                                        service: this.currentService,
+                                        url: snapshot.url,
+                                        title: snapshot.title,
+                                        step_label: `post-verify round ${round + 1}/${args.maxRounds}: extract`,
+                                        extract_reason: nextStep.reason,
+                                        candidates,
+                                        html: snapshot.html,
+                                        screenshot_jpeg_base64: snapshot.screenshot,
+                                    });
+                                    args.steps.push(`Diagnostic: uploaded extract-failure snapshot (post-verify round ${round + 1}).`);
+                                }
+                                catch {
+                                    // Silent — diagnostic uploads are best-effort.
+                                }
+                            })();
+                        }
                         // Two consecutive failed extracts on a DOM the planner
                         // keeps quoting a token from means the value's shape is
                         // not in our regex library (Railway: bare UUID; some
@@ -2260,7 +2641,7 @@ ${formatInventory(input.inventory)}`,
                 }
                 else if (nextStep.kind === "navigate") {
                     await this.browser.goto(nextStep.url);
-                    await this.browser.wait(3);
+                    // PERF: next round opens with waitForFormReady; no blind dwell.
                 }
                 else if (nextStep.kind === "wait") {
                     await this.browser.wait(Math.min(nextStep.seconds, 15));
@@ -2288,12 +2669,74 @@ ${formatInventory(input.inventory)}`,
             }
             // Re-extract — but tolerate the page still navigating from the
             // step just taken; the next round settles and re-reads.
+            const hadCredentialsBefore = credentials.api_key !== undefined || credentials.username !== undefined;
             try {
                 credentials = await this.extractCredentials();
             }
             catch {
                 // page mid-navigation — next round's waitForFormReady handles it
             }
+            // rc.16 — synthetic extract round capture. When the implicit
+            // extractCredentials() above pulls a credential out of the page
+            // *without* the planner ever having picked an `extract` step,
+            // the for-loop's early-return at the next iteration's top fires
+            // before any further capture is written. The chain that
+            // auto-promote sees then has no `observed.kind === "extract"`
+            // round, so promoteToSkill rejects with no_extract_step. Fix:
+            // when an implicit extract just succeeded and the planner's
+            // chosen step this round wasn't already `extract`, write a
+            // synthetic extract round with fresh state+inventory captured
+            // RIGHT NOW (the action just ran, the token row is now visible).
+            // Best-effort — a capture failure must never block returning the
+            // credential we already have.
+            const haveNewCredentials = !hadCredentialsBefore &&
+                (credentials.api_key !== undefined || credentials.username !== undefined);
+            if (haveNewCredentials && nextStep.kind !== "extract") {
+                try {
+                    const [postState, postInventory] = await Promise.all([
+                        this.browser.getState(),
+                        this.buildInventory(args.steps, undefined, 80),
+                    ]);
+                    const syntheticExtract = {
+                        kind: "extract",
+                        reason: `implicit extract after ${nextStep.kind} — credentials surfaced on the page`,
+                    };
+                    captureOnboardingRound({
+                        service: args.service,
+                        round: round + 1,
+                        oauth,
+                        state: postState,
+                        inventory: postInventory,
+                        observed: syntheticExtract,
+                    });
+                    if (this.roundUploader !== undefined) {
+                        void (async () => {
+                            try {
+                                await this.roundUploader({
+                                    service: args.service,
+                                    round: round + 1,
+                                    kind: syntheticExtract.kind,
+                                    url: postState.url,
+                                    title: postState.title,
+                                    inventory_count: postInventory.length,
+                                    observed_reason: syntheticExtract.reason,
+                                    html: postState.html,
+                                    ...(postState.screenshot !== undefined && postState.screenshot.length > 0
+                                        ? { screenshot_jpeg_base64: postState.screenshot }
+                                        : {}),
+                                });
+                            }
+                            catch {
+                                // best-effort
+                            }
+                        })();
+                    }
+                }
+                catch {
+                    // best-effort — synthetic capture is auto-promote plumbing,
+                    // never load-bearing for the parent signup
+                }
+            }
         }
         return credentials;
     }
@@ -2389,14 +2832,16 @@ ${loginGuidance}
 - If a "Create"/"Continue" button is disabled, look for a required terms-of-service / agreement checkbox and tick it with {"kind":"check"} — use the checkbox's own inventory selector (an entry with type=checkbox), NOT the adjacent "Terms of Service" link. A "click" on a styled checkbox often fails to flip it; use "check".
 - If an Accept / Agree / Continue button is DISABLED and the page shows a ToS / agreement modal (a long scrollable block of legal text, often inside a dialog), AND there is no agreement checkbox in the inventory to tick, return {"kind":"scroll"}. Some services (Railway is the canonical case) only enable the Accept button after the user scrolls the modal body to the bottom. The bot auto-detects the scrollable container — you do NOT need a selector. Do NOT use "click" to try to scroll; "click" does not scroll, it lands a click and returns. After scrolling, the next round should re-read the page and click the now-enabled Accept button (which will appear in the inventory).
 - Prefer the simplest credential path: a project- or organization-level API token / auth token usually needs only a name. A "personal token" with a grid of per-scope permission dropdowns is more work — choose it only if no simpler token type is offered.
+- **Token names must be unique within the account.** Many services (Railway is the canonical case) silently reject submits whose name collides with an existing token — the click registers, the button takes focus, but no token is created and no error toast is shown. Before filling a token-name input, READ the visible existing-tokens list on the page (names like "mykey", "mytoken123", any others). For the name you fill, prefer a fresh unique name like \`ts-<random>\` or \`agent-<short-suffix>\`; NEVER reuse a name that appears in the existing list — including names with sequential suffixes like \`mykey2\`, \`mykey3\` if the un-suffixed name is also present (assume the user has been iterating). If you cannot see the existing-tokens list (it scrolled off, the page hides it), pick a name with high entropy (8+ random alphanumeric chars).
 - On a token-creation form whose permission/scope dropdowns default to "No Access" / "None", you MUST set permissions BEFORE clicking the create button.
+- **Defaulted dropdowns (value="") gate submit, even when the visible label looks fine.** An inventory line marked \`(DEFAULTED — pick an explicit option before submitting)\` means a \`<select>\` is showing its first option visually but its underlying value is empty. React-form-state libraries (React Hook Form, Formik) treat those as UNTOUCHED and reject submits silently — the click on the submit button visually focuses it but no submission occurs. Issue \`{"kind":"select", "option_text":"…"}\` to commit a choice BEFORE clicking submit, even if the existing visible label ("No workspace", "None", "Select…") is the option you want. The Railway token-create form was the canonical case: typing the name and clicking Create did nothing for six rounds because the Workspace dropdown was never explicitly selected.
 - **PERMISSION SCOPE — default is MAXIMUM.** ${input.scopeHint !== undefined
             ? `The user provided a scope hint: "${input.scopeHint}". Pick option_text values aligned with this on each permission dropdown.`
             : `No scope hint was provided. Default to the HIGHEST available permission level on EVERY permission dropdown (Admin > Write > Read > anything lower). Most agent use-cases need write access; a read-only token will fail downstream when the agent tries to push data. Set "Admin" if offered; "Write" otherwise. Explicitly use option_text to specify — do NOT rely on first-option behavior, which often picks Read.`}
 - On a form with MULTIPLE permission rows (Sentry: Project, Team, Member, Issue, Event, Release, Organization), set EACH ONE before clicking Create. One step per turn — return to this turn-by-turn until every row is set.
 - Round ${input.round + 1} of ${input.maxRounds}. Prefer "done" if you're not making progress.`;
         const userBlocks = [
-            { kind: "image", media_type: "image/png", data_base64: input.state.screenshot },
+            { kind: "image", media_type: "image/jpeg", data_base64: input.state.screenshot },
             {
                 kind: "text",
                 text: `Service: ${input.service}
@@ -2496,6 +2941,16 @@ ${formatInventory(input.inventory)}${input.hint !== undefined ? `\n\nIMPORTANT
             // Negative: signin/login/logout in host+path.
             if (/(?:^|\/)(?:signin|login|logout|sign-in|log-in)\b/.test(hostPath))
                 continue;
+            // BUG-1 GUARD: registered-domain match against the target service.
+            // Without this, a Google search for "Railway signup" returned a
+            // link to storysite-production.up.railway.app/signup/ — somebody's
+            // hobby Django app hosted on Railway — and the bot filled out the
+            // form, creating a junk account on the wrong website. PSL-aware
+            // eTLD+1 comparison handles platform suffixes like .up.railway.app
+            // and .vercel.app (where each customer subdomain is its own
+            // "registered" entity) correctly.
+            if (!hostMatchesServiceDomain(url.hostname, serviceSlug))
+                continue;
             // Score: a host containing the service slug is a strong match.
             // Without a slug to compare against, every match scores 1.
             const hostLower = url.hostname.toLowerCase();
@@ -2639,6 +3094,38 @@ ${formatInventory(input.inventory)}${input.hint !== undefined ? `\n\nIMPORTANT
                 // with whatever we had (or null).
             }
         }
+        // Pass 4 — Copy-button colocation scan. Railway's "New Token"
+        // modal shows the UUID inside a <code> built character-by-span,
+        // which Pass 1's direct-text walk can't reassemble. Walk every
+        // visible "Copy" affordance's ancestor subtree, tokenize its
+        // innerText, and accept the first token that looks like a
+        // credential. Strict on shape (length 16-256, isolated token)
+        // to avoid false positives on copy-blog-post-link buttons.
+        if (apiKey === null) {
+            try {
+                const UUID_RE = /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
+                for (const candidate of await this.browser.extractCredentialsNearCopyButtons()) {
+                    // The candidate is a bare whitespace-isolated token. If it's
+                    // a UUID, accept it directly — the Copy-button colocation
+                    // is the credential signal we'd otherwise demand a textual
+                    // "api key" label for.
+                    if (UUID_RE.test(candidate)) {
+                        apiKey = candidate;
+                        break;
+                    }
+                    // Otherwise route through the normal extractor — accepts
+                    // gh*_*, sk_*, pk_*, Stripe/AWS-style prefixes, JWTs, etc.
+                    const hit = extractApiKeyFromText(candidate);
+                    if (hit !== null && !isTruncatedCapture(candidate, hit)) {
+                        apiKey = hit;
+                        break;
+                    }
+                }
+            }
+            catch {
+                // Non-fatal — leave apiKey as null and fall through.
+            }
+        }
         // Last resort: if every path returned a truncated value, persist
         // it with a `_truncated` suffix so the host agent can surface the
         // partial result to the user (better than reporting "no key