npm - imprint-mcp - Versions diffs - 0.2.1 → 0.3.1 - Mend

imprint-mcp 0.2.1 → 0.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

package/README.md +193 -189
package/examples/discoverandgo/README.md +1 -1
package/examples/echo/README.md +1 -1
package/examples/google-flights/README.md +28 -0
package/examples/google-flights/_shared/batchexecute.ts +63 -0
package/examples/google-flights/_shared/flights_request.ts +95 -0
package/examples/google-flights/_shared/package.json +9 -0
package/examples/google-flights/get_flight_booking_details/index.ts +159 -0
package/examples/google-flights/get_flight_booking_details/package.json +9 -0
package/examples/google-flights/get_flight_booking_details/parser.ts +182 -0
package/examples/google-flights/get_flight_booking_details/playbook.yaml +138 -0
package/examples/google-flights/get_flight_booking_details/request-transform.ts +86 -0
package/examples/google-flights/get_flight_booking_details/workflow.json +98 -0
package/examples/google-flights/get_flight_calendar_prices/index.ts +131 -0
package/examples/google-flights/get_flight_calendar_prices/package.json +9 -0
package/examples/google-flights/get_flight_calendar_prices/parser.ts +86 -0
package/examples/google-flights/get_flight_calendar_prices/playbook.yaml +97 -0
package/examples/google-flights/get_flight_calendar_prices/request-transform.ts +31 -0
package/examples/google-flights/get_flight_calendar_prices/workflow.json +78 -0
package/examples/google-flights/lookup_airport/index.ts +101 -0
package/examples/google-flights/lookup_airport/package.json +9 -0
package/examples/google-flights/lookup_airport/parser.ts +66 -0
package/examples/google-flights/lookup_airport/playbook.yaml +47 -0
package/examples/google-flights/lookup_airport/request-transform.ts +20 -0
package/examples/google-flights/lookup_airport/workflow.json +57 -0
package/examples/google-flights/search_flights/index.ts +219 -0
package/examples/google-flights/search_flights/package.json +9 -0
package/examples/google-flights/search_flights/parser.ts +169 -0
package/examples/google-flights/search_flights/playbook.yaml +184 -0
package/examples/google-flights/search_flights/request-transform.ts +119 -0
package/examples/google-flights/search_flights/workflow.json +143 -0
package/examples/google-hotels/README.md +29 -0
package/examples/google-hotels/_shared/batchexecute.ts +73 -0
package/examples/google-hotels/_shared/freq.ts +158 -0
package/examples/google-hotels/_shared/package.json +9 -0
package/examples/google-hotels/autocomplete_hotel_location/index.ts +80 -0
package/examples/google-hotels/autocomplete_hotel_location/package.json +9 -0
package/examples/google-hotels/autocomplete_hotel_location/parser.ts +71 -0
package/examples/google-hotels/autocomplete_hotel_location/playbook.yaml +36 -0
package/examples/google-hotels/autocomplete_hotel_location/request-transform.ts +37 -0
package/examples/google-hotels/autocomplete_hotel_location/workflow.json +36 -0
package/examples/google-hotels/get_hotel_booking_options/index.ts +143 -0
package/examples/google-hotels/get_hotel_booking_options/package.json +9 -0
package/examples/google-hotels/get_hotel_booking_options/parser.ts +271 -0
package/examples/google-hotels/get_hotel_booking_options/playbook.yaml +154 -0
package/examples/google-hotels/get_hotel_booking_options/request-transform.ts +154 -0
package/examples/google-hotels/get_hotel_booking_options/workflow.json +84 -0
package/examples/google-hotels/get_hotel_reviews/index.ts +81 -0
package/examples/google-hotels/get_hotel_reviews/package.json +9 -0
package/examples/google-hotels/get_hotel_reviews/parser.ts +128 -0
package/examples/google-hotels/get_hotel_reviews/playbook.yaml +64 -0
package/examples/google-hotels/get_hotel_reviews/request-transform.ts +42 -0
package/examples/google-hotels/get_hotel_reviews/workflow.json +37 -0
package/examples/google-hotels/search_hotels/index.ts +207 -0
package/examples/google-hotels/search_hotels/package.json +9 -0
package/examples/google-hotels/search_hotels/parser.ts +260 -0
package/examples/google-hotels/search_hotels/playbook.yaml +87 -0
package/examples/google-hotels/search_hotels/request-transform.ts +197 -0
package/examples/google-hotels/search_hotels/workflow.json +127 -0
package/examples/southwest/README.md +3 -2
package/examples/southwest/search_southwest_flights/index.ts +18 -1
package/examples/southwest/search_southwest_flights/workflow.json +18 -1
package/package.json +3 -2
package/prompts/audit-agent.md +71 -0
package/prompts/build-planning.md +74 -0
package/prompts/compile-agent.md +131 -27
package/prompts/prereq-builder.md +64 -0
package/prompts/prereq-planner.md +34 -0
package/prompts/tool-planning.md +39 -0
package/src/cli.ts +116 -3
package/src/imprint/agent.ts +5 -0
package/src/imprint/audit.ts +996 -0
package/src/imprint/backend-ladder.ts +1214 -184
package/src/imprint/build-plan.ts +1051 -0
package/src/imprint/cdp-browser-fetch.ts +592 -0
package/src/imprint/cdp-jar-cache.ts +320 -0
package/src/imprint/chromium.ts +414 -8
package/src/imprint/claude-cli-compile.ts +125 -25
package/src/imprint/codex-cli-compile.ts +26 -23
package/src/imprint/compile-agent-types.ts +38 -0
package/src/imprint/compile-agent.ts +63 -25
package/src/imprint/compile-tools.ts +1666 -66
package/src/imprint/compile.ts +13 -1
package/src/imprint/concurrency.ts +87 -0
package/src/imprint/cron.ts +4 -0
package/src/imprint/doctor.ts +48 -3
package/src/imprint/freeform-redact.ts +5 -4
package/src/imprint/install.ts +79 -4
package/src/imprint/integrations.ts +3 -3
package/src/imprint/llm.ts +56 -8
package/src/imprint/mcp-compile-server.ts +43 -10
package/src/imprint/mcp-maintenance.ts +18 -102
package/src/imprint/mcp-server.ts +73 -7
package/src/imprint/multi-progress.ts +7 -2
package/src/imprint/param-grounding.ts +367 -0
package/src/imprint/paths.ts +29 -0
package/src/imprint/playbook-runner.ts +101 -40
package/src/imprint/prereq-builder.ts +651 -0
package/src/imprint/probe-backends.ts +6 -3
package/src/imprint/record.ts +10 -1
package/src/imprint/redact.ts +30 -2
package/src/imprint/replay-capture.ts +19 -18
package/src/imprint/runtime.ts +19 -10
package/src/imprint/session-diff.ts +79 -2
package/src/imprint/session-merge.ts +9 -5
package/src/imprint/stealth-chromium.ts +79 -0
package/src/imprint/stealth-fetch.ts +309 -29
package/src/imprint/stealth-token-cache.ts +88 -0
package/src/imprint/teach-plan.ts +251 -0
package/src/imprint/teach-state.ts +10 -0
package/src/imprint/teach.ts +456 -142
package/src/imprint/tool-candidates.ts +72 -14
package/src/imprint/tool-plan.ts +313 -0
package/src/imprint/tracing.ts +135 -6
package/src/imprint/types.ts +61 -3
package/examples/google-flights/search_google_flights/index.ts +0 -101
package/examples/google-flights/search_google_flights/parser.test.ts +0 -140
package/examples/google-flights/search_google_flights/parser.ts +0 -189
package/examples/google-flights/search_google_flights/playbook.yaml +0 -130
package/examples/google-flights/search_google_flights/workflow.json +0 -48
package/examples/google-hotels/search_google_hotels/index.ts +0 -194
package/examples/google-hotels/search_google_hotels/parser.test.ts +0 -168
package/examples/google-hotels/search_google_hotels/parser.ts +0 -330
package/examples/google-hotels/search_google_hotels/playbook.yaml +0 -125
package/examples/google-hotels/search_google_hotels/workflow.json +0 -111
package/examples/namecheap-domains/search_namecheap_domains/index.ts +0 -144
package/examples/namecheap-domains/search_namecheap_domains/parser.ts +0 -380
package/examples/namecheap-domains/search_namecheap_domains/playbook.yaml +0 -50
package/examples/namecheap-domains/search_namecheap_domains/request-transform.ts +0 -136
package/examples/namecheap-domains/search_namecheap_domains/workflow.json +0 -97

package/src/imprint/param-grounding.ts ADDED Viewed

@@ -0,0 +1,367 @@
+/**
+ * Event-correlated differential param grounding.
+ *
+ * The candidate detector reliably identifies WHICH inputs the user controlled
+ * (`likelyParams`) and WHICH events toggled them (`eventSeqs`) — but the compile
+ * agent historically grounded a param by eyeballing a single request, and when
+ * the value wasn't obviously present it gave up and shipped the param
+ * `verified:false`, inert. Yet the encoding is almost always right there: the
+ * request a filter-toggle event triggers differs from the prior equivalent
+ * request at exactly the position that param controls.
+ *
+ * This module makes that differential deterministic and site-agnostic: for each
+ * UI event, find the request it triggered, diff it against the most recent
+ * comparable request (same endpoint), and report the changed paths. The compile
+ * agent (and the precomputed hint surfaced to it) then maps each diff to a
+ * `likelyParam` — the semantic step the model is good at — instead of guessing
+ * at an encoding. Decoding is generic (JSON body, an `f.req=`-embedded JSON
+ * envelope as used by Google's batchexecute, or plain form fields), so this is
+ * not specific to any one site.
+ */
+import type { CapturedRequest, Session } from './types.ts';
+/** One changed leaf position produced by diffing two decoded request bodies. */
+interface GroundingChange {
+  /** JSON path into the decoded request body, e.g. "[1][4][3]". */
+  path: string;
+  /** Serialized value on the "before" side of the diff (long values are truncated). */
+  before: string;
+  /** Serialized value on the "after" side of the diff (long values are truncated). */
+  after: string;
+}
+/** Result of grounding one UI event against the request traffic around it. */
+interface EventGrounding {
+  /** Sequence number of the UI event that was grounded. */
+  eventSeq: number;
+  /** Human label from the event detail (button text / aria-label / id). */
+  label: string;
+  /** The request the event triggered (first comparable request after it). */
+  triggeredSeq?: number;
+  /** The prior request of the same endpoint that the diff is taken against. */
+  priorSeq?: number;
+  /** Endpoint key shared by the triggered and prior requests. */
+  endpoint?: string;
+  /** Changed leaf positions between the prior and triggered bodies; empty when
+   *  no triggered request or no prior request was found. */
+  changes: GroundingChange[];
+}
+/** Maximum number of requests following an event that are scanned when looking
+ *  for the request that event triggered. */
+const TRIGGER_WINDOW = 12;
+/** Turn a raw request body into a value that can be structurally compared.
+ *
+ *  Attempts, in order:
+ *   1. the body itself as JSON (when it starts with `{` or `[`);
+ *   2. a form-encoded body with an `f.req` field holding a JSON envelope — if
+ *      the envelope looks like `[[["rpcid","<inner-json-string>",…]]]` the
+ *      parsed inner payload is returned, otherwise the envelope itself;
+ *   3. a flat `{ field: value }` map of the form fields;
+ *   4. the trimmed string as-is.
+ *
+ *  @param body Raw request body, if any.
+ *  @returns The decoded value, or `undefined` when `body` is empty/absent.
+ *  Never throws. */
+export function decodeBodyForDiff(body: string | undefined): unknown {
+  if (!body) return undefined;
+  const text = body.trim();
+
+  // 1. Raw JSON document.
+  const lead = text[0];
+  if (lead === '{' || lead === '[') {
+    try {
+      return JSON.parse(text);
+    } catch {
+      /* not JSON */
+    }
+  }
+
+  // Anything that does not look like `key=value[&…]` is returned verbatim.
+  const looksFormEncoded = /(^|&)[\w.]+=/.test(text);
+  if (!looksFormEncoded) return text;
+
+  const fields = new URLSearchParams(text);
+
+  // 2. batchexecute-style envelope carried in the `f.req` field.
+  const envelopeText = fields.get('f.req');
+  if (envelopeText !== null) {
+    let envelopeParsed = true;
+    // biome-ignore lint/suspicious/noExplicitAny: arbitrary decoded JSON
+    let envelope: any;
+    try {
+      envelope = JSON.parse(envelopeText);
+    } catch {
+      /* f.req not JSON */
+      envelopeParsed = false;
+    }
+    if (envelopeParsed) {
+      // batchexecute envelope: [[["rpcid","<inner json string>", …]]]
+      const inner = envelope?.[0]?.[0]?.[1];
+      if (typeof inner !== 'string') return envelope;
+      try {
+        return JSON.parse(inner);
+      } catch {
+        return envelope;
+      }
+    }
+  }
+
+  // 3. Plain form fields (a repeated key keeps its last value).
+  const flat: Record<string, string> = {};
+  fields.forEach((value, key) => {
+    flat[key] = value;
+  });
+  return flat;
+}
+/** Deep structural diff → changed leaf paths (a→b).
+ *
+ *  Identical subtrees are skipped via a cheap stringify equality check. Two
+ *  arrays are compared index by index, two plain objects key by key; any other
+ *  pairing (including an array against a plain object) is reported as a single
+ *  changed leaf at the current path.
+ *
+ *  @param a    "Before" value.
+ *  @param b    "After" value.
+ *  @param path Path prefix of the current position (empty at the root).
+ *  @param out  Accumulator the changes are appended to.
+ *  @returns `out`, holding one entry per changed leaf. */
+export function structuralDiff(
+  a: unknown,
+  b: unknown,
+  path = '',
+  out: GroundingChange[] = [],
+): GroundingChange[] {
+  if (JSON.stringify(a) === JSON.stringify(b)) return out;
+  const aIsArray = Array.isArray(a);
+  const bIsArray = Array.isArray(b);
+  if (aIsArray && bIsArray) {
+    const n = Math.max(a.length, b.length);
+    for (let i = 0; i < n; i++) structuralDiff(a[i], b[i], `${path}[${i}]`, out);
+    return out;
+  }
+  // Only recurse key-by-key when BOTH sides are plain objects. An array against
+  // an object is a change of container type: recursing would compare index keys
+  // with property names and could report nothing (e.g. `[]` vs `{}`).
+  if (!aIsArray && !bIsArray && a && b && typeof a === 'object' && typeof b === 'object') {
+    const keys = new Set([...Object.keys(a as object), ...Object.keys(b as object)]);
+    for (const k of keys) {
+      structuralDiff(
+        (a as Record<string, unknown>)[k],
+        (b as Record<string, unknown>)[k],
+        path ? `${path}.${k}` : k,
+        out,
+      );
+    }
+    return out;
+  }
+  const cap = (v: unknown): string => {
+    // JSON.stringify yields undefined for functions/symbols; fall back to String().
+    const s = v === undefined ? 'undefined' : (JSON.stringify(v) ?? String(v));
+    return s.length > 48 ? `${s.slice(0, 48)}…` : s;
+  };
+  out.push({ path: path || '(root)', before: cap(a), after: cap(b) });
+  return out;
+}
+/** A stable key grouping "comparable" requests: the batchexecute rpcid when
+ *  present, else METHOD + URL path (query stripped).
+ *
+ *  @param req Captured request; a missing `url` is treated as the empty string
+ *    and a missing `method` as "GET".
+ *  @returns `rpc:<id>` when the URL query carries `rpcids=`/`rpcid=`, otherwise
+ *    `<METHOD> <path>`. Never throws. */
+function endpointKey(req: CapturedRequest): string {
+  const url = req.url ?? '';
+  const method = req.method ?? 'GET';
+  // Accept both `rpcids=` (Google batchexecute, plural) and a singular `rpcid=`
+  // in the URL query, matching tool-candidates' endpoint-family keying — so a
+  // batchexecute-style endpoint never collapses distinct rpcs to one path key.
+  const rpc = /[?&]rpcids?=([^&]+)/.exec(url);
+  if (rpc) {
+    const raw = rpc[1] ?? '';
+    try {
+      return `rpc:${decodeURIComponent(raw)}`;
+    } catch {
+      // Malformed percent-escape (URIError): key on the raw text instead of
+      // aborting the whole grounding pass.
+      return `rpc:${raw}`;
+    }
+  }
+  try {
+    const u = new URL(url);
+    return `${method} ${u.pathname}`;
+  } catch {
+    // Relative or otherwise unparsable URL: strip the query by hand.
+    return `${method} ${url.split('?')[0]}`;
+  }
+}
+/** Read the request body off a captured request. The primary field is `.body`;
+ *  `.requestBody` is accepted as an alternate shape. Returns `undefined` when
+ *  neither is set. */
+function bodyOf(req: CapturedRequest): string | undefined {
+  const loose = req as unknown as { body?: string; requestBody?: string };
+  if (loose.body != null) return loose.body;
+  if (loose.requestBody != null) return loose.requestBody;
+  return undefined;
+}
+/** Derive a short human-readable label (at most 48 characters) from an event's
+ *  `detail` string.
+ *
+ *  When `detail` is a JSON object, the first present of `text`, `ariaLabel`,
+ *  `name`, `id` is used with whitespace runs collapsed. When `detail` is not
+ *  JSON — or parses to something that is not an object (`null`, a number, a
+ *  bare string) — the raw detail text is used instead.
+ *
+ *  @param detail Raw event detail.
+ *  @returns The label; may be empty. Never throws. */
+function eventLabel(detail: string): string {
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(detail);
+  } catch {
+    return detail.slice(0, 48);
+  }
+  // JSON.parse happily returns null / primitives; property access on null would
+  // throw, and a primitive carries no label fields, so fall back to the raw text.
+  if (parsed === null || typeof parsed !== 'object') return detail.slice(0, 48);
+  const d = parsed as Record<string, unknown>;
+  const txt = d.text ?? d.ariaLabel ?? d.name ?? d.id ?? '';
+  return String(txt).replace(/\s+/g, ' ').trim().slice(0, 48);
+}
+/** Telemetry/beacon endpoints that fire constantly and are never the tool's
+ *  load-bearing request — excluded when we can't scope to the candidate's own
+ *  endpoints. */
+const TELEMETRY = /\/(log|gen_204|jserror|ping|beacon|csi|_\/bscframe|metrics|stats)\b/i;
+/** True when a decoded body is a structured value (array or object) and thus
+ *  worth diffing — as opposed to a raw, often gzipped/opaque, string. */
+function isStructured(v: unknown): boolean {
+  if (v === null || v === undefined) return false;
+  return typeof v === 'object';
+}
+/** Ground a single event: find the request it triggered and diff against the
+ *  most recent prior request of the same endpoint.
+ *
+ *  `relevantEndpoints` (the candidate's own request endpoints, via endpointKey)
+ *  scopes the search to the tool's load-bearing requests — without it a burst of
+ *  telemetry POSTs between the click and the real request would be mistaken for
+ *  the trigger.
+ *
+ *  @param session            Recorded session (requests and events).
+ *  @param eventSeq           Sequence number of the event to ground.
+ *  @param relevantEndpoints  Optional endpoint keys; when present and non-empty
+ *    only requests to one of them qualify as the trigger. Otherwise any request
+ *    with a structured body whose URL does not match TELEMETRY qualifies.
+ *  @returns The grounding record; `changes` is empty when no trigger request or
+ *    no prior request of the same endpoint was found. */
+export function groundEvent(
+  session: Session,
+  eventSeq: number,
+  relevantEndpoints?: Set<string>,
+): EventGrounding {
+  const reqs = [...session.requests].sort((a, b) => a.seq - b.seq);
+  const ev = session.events.find((e) => e.seq === eventSeq);
+  const label = ev ? eventLabel(ev.detail) : '';
+
+  // The scan bound depends only on the event, so compute it once instead of
+  // re-filtering the request list for every candidate request.
+  const lastSeq = eventSeq + windowEnd(reqs, eventSeq);
+  const scoped = relevantEndpoints !== undefined && relevantEndpoints.size > 0;
+
+  // Decode each body at most once; the same request may be inspected while
+  // searching for the trigger and again when diffing.
+  const decodedCache = new Map<CapturedRequest, unknown>();
+  const decodedBody = (r: CapturedRequest): unknown => {
+    if (!decodedCache.has(r)) decodedCache.set(r, decodeBodyForDiff(bodyOf(r)));
+    return decodedCache.get(r);
+  };
+
+  const triggered = reqs.find((r) => {
+    if (r.seq <= eventSeq || r.seq > lastSeq) return false;
+    const decoded = decodedBody(r);
+    if (decoded === undefined) return false;
+    if (scoped) return relevantEndpoints.has(endpointKey(r));
+    // Fallback: structured body + not an obvious telemetry endpoint.
+    return isStructured(decoded) && !TELEMETRY.test(r.url ?? '');
+  });
+  if (!triggered) return { eventSeq, label, changes: [] };
+
+  const key = endpointKey(triggered);
+  // Most recent earlier request to the same endpoint that has a decodable body.
+  const prior = [...reqs]
+    .reverse()
+    .find(
+      (r) => r.seq < triggered.seq && endpointKey(r) === key && decodedBody(r) !== undefined,
+    );
+  const changes = prior ? structuralDiff(decodedBody(prior), decodedBody(triggered)) : [];
+  return {
+    eventSeq,
+    label,
+    triggeredSeq: triggered.seq,
+    priorSeq: prior?.seq,
+    endpoint: key,
+    changes,
+  };
+}
+/** Size of the scan window for an event, expressed as a seq distance.
+ *
+ *  Takes the first TRIGGER_WINDOW requests (in the given order) whose seq is
+ *  greater than `eventSeq` and returns how far the last of them lies past the
+ *  event. When no request follows the event, TRIGGER_WINDOW itself is returned. */
+function windowEnd(reqs: CapturedRequest[], eventSeq: number): number {
+  const following: CapturedRequest[] = [];
+  for (const candidate of reqs) {
+    if (following.length >= TRIGGER_WINDOW) break;
+    if (candidate.seq > eventSeq) following.push(candidate);
+  }
+  const furthest = following.at(-1);
+  if (!furthest) return TRIGGER_WINDOW;
+  return furthest.seq - eventSeq;
+}
+/** Ground every event in `eventSeqs` and keep only those with a meaningful diff.
+ *
+ *  Events that triggered nothing or changed nothing are dropped. Paths that
+ *  change in many of the remaining events are then removed as session churn,
+ *  and events left without any change are dropped as well.
+ *
+ *  Pass `relevantEndpoints` = endpointKey() of the candidate's own request seqs
+ *  so the diff is taken against the tool's load-bearing request, not telemetry. */
+export function groundingForEvents(
+  session: Session,
+  eventSeqs: number[],
+  relevantEndpoints?: Set<string>,
+): EventGrounding[] {
+  const grounded: EventGrounding[] = [];
+  for (const seq of eventSeqs) {
+    const result = groundEvent(session, seq, relevantEndpoints);
+    if (result.changes.length > 0) grounded.push(result);
+  }
+
+  // Count, per path, in how many events it changed (once per event at most).
+  // Positions that change across MOST events are per-call session state
+  // (rotating tokens, pagination flags, a display-mode value), not the param an
+  // event toggled; a param's encoding only shows up in the diff(s) of the
+  // event(s) that control it.
+  const eventsPerPath = new Map<string, number>();
+  for (const result of grounded) {
+    const distinctPaths = new Set<string>();
+    for (const change of result.changes) distinctPaths.add(change.path);
+    distinctPaths.forEach((p) => {
+      eventsPerPath.set(p, (eventsPerPath.get(p) ?? 0) + 1);
+    });
+  }
+
+  const churnAt = Math.max(3, Math.ceil(grounded.length / 2));
+  for (const result of grounded) {
+    result.changes = result.changes.filter(
+      (change) => (eventsPerPath.get(change.path) ?? 0) < churnAt,
+    );
+  }
+  return grounded.filter((result) => result.changes.length > 0);
+}
+/** Collect the endpoint keys of the session requests whose seq appears in
+ *  `seqs`. Seqs with no matching request are ignored. */
+export function endpointsForSeqs(session: Session, seqs: number[]): Set<string> {
+  const keys = new Set<string>();
+  seqs.forEach((seq) => {
+    const match = session.requests.find((x) => x.seq === seq);
+    if (match) keys.add(endpointKey(match));
+  });
+  return keys;
+}
+// ─── Input-value provenance ──────────────────────────────────────────────────
+//
+// The grounding above covers params the user *toggled* (filters/sort). It does
+// not cover a primary param whose value is an opaque id the request can't carry
+// as plain text — e.g. an entity/object handle, an account id, a place/geo id, a
+// category token. The compile agent historically shipped these as the raw param
+// text, which the backend silently ignores and falls back to a default (an
+// unfiltered/global result set, or a server-chosen default scope). The id was
+// never the user's text; it was *minted by an earlier response* and chained into
+// the request. That cross-request data-flow is the signal this detects — keyed
+// on structure, not any vendor's id format.
+/** One request-body position whose id-like value was first seen in the
+ *  response of an earlier request. */
+interface InputProvenance {
+  /** JSON path into the decoded request body where the minted value sits. */
+  path: string;
+  /** Example resolved value (truncated). Varies per call — the PATH is the signal. */
+  valueSample: string;
+  /** The candidate request that consumes the value. */
+  requestSeq: number;
+  /** Earliest earlier request whose RESPONSE first carried this value. */
+  sourceSeq: number;
+  /** Endpoint key of the source request. */
+  sourceEndpoint: string;
+  /** True when the source is the tool's own endpoint (resolve-then-refine: an
+   *  initial text request whose response yields the id, re-sent as a refined
+   *  request carrying that id). */
+  selfChain: boolean;
+}
+/** An opaque, machine-minted identifier — not human-typed text. Vendor-agnostic:
+ *  keyed on structure (no whitespace, long enough, mixes character classes or is
+ *  a delimited handle), not on any specific id format. Excludes free text
+ *  (multi-word phrases, bare words), ISO dates, and plain numbers — including
+ *  signed and decimal ones such as "-1234567" or "1234.56" — so they never trip
+ *  it, while still catching namespaced handles ("ns/abc123"), hex ids, UUIDs,
+ *  and base64-ish session handles.
+ *
+ *  @param v Candidate string value.
+ *  @returns True when `v` looks like an opaque identifier. */
+function isIdLike(v: string): boolean {
+  if (/\s/.test(v)) return false; // free text has spaces
+  if (v.length < 6) return false; // too short to be an opaque handle
+  if (/^\d{4}-\d{2}-\d{2}([T ]|$)/.test(v)) return false; // ISO date / datetime
+  // A signed/decimal numeric literal is an amount or count, not a handle; without
+  // this its "." or "-" would be mistaken for id punctuation below.
+  if (/^[+-]?\d+(\.\d+)?$/.test(v)) return false;
+  const hasLetter = /[A-Za-z]/.test(v);
+  const hasDigit = /\d/.test(v);
+  const hasIdPunct = /[/:_.+=~-]/.test(v); // namespaced / delimited handle
+  // Opaque if it mixes letters+digits (a token), or is a delimited handle that
+  // still carries an alphanumeric payload. A bare word or a pure number is not.
+  return (hasLetter && hasDigit) || (hasIdPunct && (hasLetter || hasDigit));
+}
+/** Read the response body recorded on a captured request. Returns `undefined`
+ *  when there is no response or its body is not a string. */
+function responseBodyOf(req: CapturedRequest): string | undefined {
+  const candidate = (req as unknown as { response?: { body?: string } }).response?.body;
+  if (typeof candidate !== 'string') return undefined;
+  return candidate;
+}
+/** Walk a decoded value depth-first and collect every string leaf of at least
+ *  four characters together with its path (`[i]` for array indices, `.key` for
+ *  object properties).
+ *
+ *  @param v    Value to walk.
+ *  @param path Path prefix of the current position (empty at the root).
+ *  @param out  Accumulator the leaves are appended to.
+ *  @returns `out`. */
+function leafStrings(
+  v: unknown,
+  path = '',
+  out: { path: string; val: string }[] = [],
+): { path: string; val: string }[] {
+  if (typeof v === 'string') {
+    if (v.length >= 4) out.push({ path, val: v });
+    return out;
+  }
+  if (Array.isArray(v)) {
+    for (let i = 0; i < v.length; i++) leafStrings(v[i], `${path}[${i}]`, out);
+    return out;
+  }
+  if (v && typeof v === 'object') {
+    const record = v as Record<string, unknown>;
+    for (const key of Object.keys(record)) {
+      const childPath = path ? `${path}.${key}` : key;
+      leafStrings(record[key], childPath, out);
+    }
+  }
+  return out;
+}
+/** Find request-body positions whose id-like value was chained in from an
+ *  earlier response rather than supplied as the user's own text.
+ *
+ *  Candidate requests are visited in ascending seq order. For each string leaf
+ *  of a structured, decoded body that looks like an opaque id, the earliest
+ *  request with a lower seq whose response body contains that value is taken as
+ *  its source. Results are deduped by endpoint+path (the value varies per call;
+ *  the position is the durable signal).
+ *
+ *  @param session       Recorded session.
+ *  @param candidateSeqs Seqs of the candidate's own requests.
+ *  @returns One entry per distinct endpoint+path with an upstream source. */
+export function inputProvenance(session: Session, candidateSeqs: number[]): InputProvenance[] {
+  const ordered = [...session.requests].sort((a, b) => a.seq - b.seq);
+  const reported = new Set<string>();
+  const findings: InputProvenance[] = [];
+  const ascendingSeqs = [...candidateSeqs].sort((a, b) => a - b);
+
+  for (const seq of ascendingSeqs) {
+    const consumer = ordered.find((x) => x.seq === seq);
+    if (!consumer) continue;
+
+    const payload = decodeBodyForDiff(bodyOf(consumer));
+    if (payload == null || typeof payload !== 'object') continue;
+
+    const endpoint = endpointKey(consumer);
+    for (const leaf of leafStrings(payload)) {
+      if (!isIdLike(leaf.val)) continue;
+
+      const dedupeKey = `${endpoint}|${leaf.path}`;
+      if (reported.has(dedupeKey)) continue;
+
+      const source = ordered.find((x) => {
+        if (x.seq >= seq) return false;
+        const responseText = responseBodyOf(x);
+        return responseText !== undefined && responseText.includes(leaf.val);
+      });
+      // not minted upstream → it IS the param's own text / a constant
+      if (!source) continue;
+
+      reported.add(dedupeKey);
+      const sourceEndpoint = endpointKey(source);
+      const valueSample = leaf.val.length > 40 ? `${leaf.val.slice(0, 40)}…` : leaf.val;
+      findings.push({
+        path: leaf.path,
+        valueSample,
+        requestSeq: seq,
+        sourceSeq: source.seq,
+        sourceEndpoint,
+        selfChain: sourceEndpoint === endpoint,
+      });
+    }
+  }
+  return findings;
+}

package/src/imprint/paths.ts CHANGED Viewed

@@ -38,6 +38,35 @@ export function localSessionsDir(site: string): string {
   return pathJoin(localSiteDir(site), 'sessions');
 }
+/** Where `imprint audit <site>` writes its report by default: a per-site
+ *  sidecar file (`~/.imprint/<site>/.audit-report.json`). */
+export function localAuditReportPath(site: string): string {
+  const siteDir = localSiteDir(site);
+  return pathJoin(siteDir, '.audit-report.json');
+}
+/** Directory holding modules shared by all of a site's tools
+ *  (`~/.imprint/<site>/_shared`). Per-tool artifacts import from it through the
+ *  relative path `../_shared/<name>.ts`. The tool loader and completed-workflow
+ *  discovery both skip `_shared` (it has no index.ts). */
+export function localSharedDir(site: string): string {
+  const siteDir = localSiteDir(site);
+  return pathJoin(siteDir, '_shared');
+}
+/** Resolve a shared-module relative path (e.g. "_shared/sign.ts" or "sign.ts")
+ *  to an absolute path under the site's shared dir, rejecting traversal.
+ *
+ *  @param site    Site identifier.
+ *  @param relPath Module path, optionally prefixed with `_shared/`.
+ *  @returns Absolute path of the module file inside the site's `_shared` dir.
+ *  @throws Error when `relPath` contains "..", starts with "/", contains a
+ *    backslash, names a nested path, or names no file at all (empty, ".", or
+ *    just the `_shared/` prefix). */
+export function localSharedModulePath(site: string, relPath: string): string {
+  if (relPath.includes('..') || relPath.startsWith('/') || relPath.includes('\\')) {
+    throw new Error(
+      `Invalid shared module path: "${relPath}". Must not contain "..", start with "/", or contain "\\".`,
+    );
+  }
+  const prefix = '_shared/';
+  const base = relPath.startsWith(prefix) ? relPath.slice(prefix.length) : relPath;
+  // An empty or "." base would resolve to the shared directory itself rather
+  // than to a module file inside it.
+  if (base === '' || base === '.' || base.includes('/')) {
+    throw new Error(
+      `Invalid shared module path: "${relPath}". Must be a flat file under _shared/.`,
+    );
+  }
+  return pathJoin(localSharedDir(site), base);
+}
 export function defaultSessionJsonlPath(site: string, timestamp: string): string {
   return pathJoin(localSessionsDir(site), `${timestamp}.jsonl`);
 }

package/src/imprint/playbook-runner.ts CHANGED Viewed

@@ -12,6 +12,7 @@ import { createLog } from './log.ts';
 import { imprintHomeDir } from './paths.ts';
 import { parsePlaybook } from './playbook-parser.ts';
 import { substituteString } from './runtime.ts';
+import { getStealthChromium, getStealthExecutablePath } from './stealth-chromium.ts';
 import type {
   Locator,
   Playbook,
@@ -64,33 +65,24 @@ export async function runPlaybook(opts: RunPlaybookOptions): Promise<ToolResult>
   if (opts.pageOverride) {
     page = opts.pageOverride;
   } else {
-    // playwright-extra + stealth plugin patches navigator.webdriver,
-    // plugin enumeration, WebGL vendor strings, etc. Vanilla headless
-    // Playwright eats a 403 from any decent enterprise site (verified:
-    // Southwest 403 → 200 with stealth).
     let chromium: typeof import('playwright').chromium;
     try {
-      const pwExtra = await import('playwright-extra');
-      const stealthMod = await import('puppeteer-extra-plugin-stealth');
-      const stealthFactory =
-        (stealthMod as { default?: () => unknown }).default ??
-        (stealthMod as unknown as () => unknown);
-      pwExtra.chromium.use(stealthFactory() as never);
-      chromium = pwExtra.chromium as unknown as typeof import('playwright').chromium;
-    } catch {
-      try {
-        const pw = await import('playwright');
-        chromium = pw.chromium;
-      } catch (innerErr) {
-        return {
-          ok: false,
-          error: 'UNKNOWN',
-          message: `Playwright not available: ${errMsg(innerErr)}. Run: bunx playwright install chromium`,
-        };
-      }
+      chromium = await getStealthChromium();
+    } catch (innerErr) {
+      return {
+        ok: false,
+        error: 'UNKNOWN',
+        message: `Playwright not available: ${errMsg(innerErr)}. Run: bunx playwright install chromium`,
+      };
     }
     try {
-      browser = await chromium.launch({ headless: !opts.headed });
+      // Use the same full Chrome binary as `imprint record` — NOT
+      // chrome-headless-shell, which Akamai detects at the binary level
+      // regardless of stealth-plugin JS patches.
+      browser = await chromium.launch({
+        headless: !opts.headed,
+        executablePath: getStealthExecutablePath(),
+      });
     } catch (err) {
       return {
         ok: false,
@@ -159,10 +151,23 @@ export async function runPlaybook(opts: RunPlaybookOptions): Promise<ToolResult>
   } catch (err) {
     const screenshotPath = await screenshot(page, playbook.toolName, lastStep);
     const suffix = screenshotPath ? `\nscreenshot: ${screenshotPath}` : '';
+    const errStr = errMsg(err);
+    // Classify the failure mode honestly: a missing locator, a step
+    // timeout, or a `forResponse` wait that didn't resolve are
+    // transient page-state signals (the DOM rendered differently than
+    // the recording, or the page was slow). Those are NETWORK-class
+    // signals, not tool-defect (BAD_RESPONSE) signals — the audit
+    // gate's `tool_broken` classifier treats BAD_RESPONSE as a real
+    // bug, which over-attributes drift to defects. Map known
+    // transient-shape errors to NETWORK so they count as `infra`
+    // (re-runnable) rather than `tool_broken` (permanent defect).
+    const isTransient = /No locator matched|Timeout \d+ms exceeded|forResponse|waiting for/i.test(
+      errStr,
+    );
     return {
       ok: false,
-      error: 'BAD_RESPONSE',
-      message: `Playbook failed at step ${lastStep}: ${errMsg(err)}${suffix}`,
+      error: isTransient ? 'NETWORK' : 'BAD_RESPONSE',
+      message: `Playbook failed at step ${lastStep}: ${errStr}${suffix}`,
     };
   } finally {
     if (!opts.pageOverride) {
@@ -252,11 +257,36 @@ async function executeStep(
     case 'type': {
       const locator = await firstMatching(page, step.locators, params, timeoutMs);
       const value = subst(step.value, params);
-      if (step.clear === false) {
-        await locator.pressSequentially(value, { timeout: timeoutMs });
-      } else {
-        await locator.fill(value, { timeout: timeoutMs });
+      // Detect element type so we dispatch the right action. `type` on a
+      // <select> means "choose the option whose value/label matches" —
+      // a recording can capture either action shape, and the audit-time
+      // tool may also call type with a value that happens to land on a
+      // select. Without this branch, fill()/pressSequentially() throw
+      // "Element is not an input/textarea" and the whole playbook
+      // aborts.
+      const tagName = await locator.evaluate((el) => el.tagName.toLowerCase());
+      if (tagName === 'select') {
+        // Try value first, fall back to label — match Playwright's own
+        // selectOption semantics.
+        try {
+          await locator.selectOption({ value }, { timeout: timeoutMs });
+        } catch {
+          await locator.selectOption({ label: value }, { timeout: timeoutMs });
+        }
+        await applyWait(page, step.wait_for, locator, timeoutMs);
+        return;
+      }
+      // Inputs / textareas: pressSequentially fires real input / keydown
+      // / keyup events. React-style frameworks bind to synthetic events
+      // that locator.fill() doesn't trigger — typing into an autocomplete
+      // or debounced search field with fill() updates the input visually
+      // but the framework's onChange handler never runs, so the dropdown
+      // / XHR / next-step locator times out. The ~10ms-per-char internal
+      // delay is negligible against page-load latency.
+      if (step.clear !== false) {
+        await locator.fill('', { timeout: timeoutMs });
       }
+      await locator.pressSequentially(value, { timeout: timeoutMs });
       await applyWait(page, step.wait_for, locator, timeoutMs);
       return;
     }
@@ -376,10 +406,27 @@ async function applyWait(
   }
   if ('xhr' in wait) {
     const re = new RegExp(wait.xhr);
-    await page.waitForResponse(
-      (resp) => re.test(resp.url()) && (!wait.method || resp.request().method() === wait.method),
-      { timeout: wait.timeout_ms ?? timeoutMs },
-    );
+    try {
+      await page.waitForResponse(
+        (resp) => re.test(resp.url()) && (!wait.method || resp.request().method() === wait.method),
+        { timeout: wait.timeout_ms ?? timeoutMs },
+      );
+    } catch (err) {
+      // A missed `wait_for: {xhr: ...}` is usually a soft signal: the
+      // recorded action (typing into an autocomplete, clicking a tab)
+      // happened, but the page didn't fire the exact XHR we matched on
+      // — either the URL pattern drifted, the debounce window was
+      // tighter than our wait, or the page chose a cached response. The
+      // next playbook step has its own locator / wait_for and will fail
+      // loudly if the page state is actually wrong. Letting the
+      // playbook continue here gives it a real chance to recover
+      // (observed on Costco's pickup-location autocomplete: typing
+      // succeeded, the XHR just never fired before our 30s window).
+      const msg = err instanceof Error ? err.message : String(err);
+      // Re-throw closures / nav errors that aren't simple timeouts —
+      // those signal real page breakdown.
+      if (!/timeout|Timeout/.test(msg)) throw err;
+    }
     return;
   }
   if ('sleep_ms' in wait) {
@@ -387,7 +434,10 @@ async function applyWait(
   }
 }
-async function extractResult(
+/** Exported for testing — drives the XHR-body extraction contract that
+ *  must stay symmetric with the workflow runtime (runtime.ts:279-285).
+ */
+export async function extractResult(
   page: Page,
   result: PlaybookResult,
   captured: Array<{ url: string; method: string; status: number; body: string | null }>,
@@ -410,16 +460,27 @@ async function extractResult(
         `Result XHR returned ${last.status} (${last.url}): ${last.body.slice(0, 300)}.${hint}`,
       );
     }
-    let parsed: unknown;
+    // Mirror runtime.ts (workflow path) semantics: try JSON first, but fall
+    // back to the raw body string when parsing fails. Many APIs return
+    // non-JSON envelopes that a downstream parser knows how to decode —
+    // Google XSSI prefix (`)]}'`), chunked batchexecute payloads, JSONP
+    // callbacks, protobuf-over-HTTP, etc. Throwing here would bypass the
+    // parser entirely; passing the raw bytes lets the parser do its job and
+    // keeps the playbook fallback's contract symmetric with the workflow
+    // path.
+    let parsed: unknown = last.body;
     try {
       parsed = JSON.parse(last.body);
     } catch {
-      throw new Error(`Result XHR body was not JSON (${last.url}): ${last.body.slice(0, 200)}`);
+      // Path-based extraction (`items[].id`) needs a structured value to
+      // navigate, so we still fail loudly in that case. Whole-body
+      // extraction (`extract === '*'`) is the contract that says "the
+      // parser owns the bytes," so we pass them through.
+      if (result.extract !== '*' && result.extract !== '') {
+        throw new Error(`Result XHR body was not JSON (${last.url}): ${last.body.slice(0, 200)}`);
+      }
     }
-    // `*` returns the full parsed JSON unchanged — useful when the consumer
-    // (parser.ts, MCP caller) wants the rich object graph rather than just
-    // numeric leaves.
-    if (result.extract === '*') {
+    if (result.extract === '*' || result.extract === '') {
       return { [result.return_as]: parsed, source_url: last.url };
     }
     return { [result.return_as]: extractAt(parsed, result.extract), source_url: last.url };