npm - @totalreclaw/totalreclaw - Versions diffs - 3.3.1-rc.2 → 3.3.1-rc.21 - Mend

@totalreclaw/totalreclaw 3.3.1-rc.2 → 3.3.1-rc.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70) hide show

package/CHANGELOG.md +330 -0
package/SKILL.md +50 -83
package/api-client.ts +18 -11
package/config.ts +117 -3
package/crypto.ts +10 -2
package/dist/api-client.js +226 -0
package/dist/billing-cache.js +100 -0
package/dist/claims-helper.js +606 -0
package/dist/config.js +280 -0
package/dist/consolidation.js +258 -0
package/dist/contradiction-sync.js +1034 -0
package/dist/crypto.js +138 -0
package/dist/digest-sync.js +361 -0
package/dist/download-ux.js +63 -0
package/dist/embedding.js +86 -0
package/dist/extractor.js +1225 -0
package/dist/first-run.js +103 -0
package/dist/fs-helpers.js +563 -0
package/dist/gateway-url.js +197 -0
package/dist/generate-mnemonic.js +13 -0
package/dist/hot-cache-wrapper.js +101 -0
package/dist/import-adapters/base-adapter.js +64 -0
package/dist/import-adapters/chatgpt-adapter.js +238 -0
package/dist/import-adapters/claude-adapter.js +114 -0
package/dist/import-adapters/gemini-adapter.js +201 -0
package/dist/import-adapters/index.js +26 -0
package/dist/import-adapters/mcp-memory-adapter.js +219 -0
package/dist/import-adapters/mem0-adapter.js +158 -0
package/dist/import-adapters/types.js +1 -0
package/dist/index.js +5348 -0
package/dist/llm-client.js +686 -0
package/dist/llm-profile-reader.js +346 -0
package/dist/lsh.js +62 -0
package/dist/onboarding-cli.js +750 -0
package/dist/pair-cli.js +344 -0
package/dist/pair-crypto.js +359 -0
package/dist/pair-http.js +404 -0
package/dist/pair-page.js +826 -0
package/dist/pair-qr.js +107 -0
package/dist/pair-remote-client.js +410 -0
package/dist/pair-session-store.js +566 -0
package/dist/pin.js +542 -0
package/dist/qa-bug-report.js +301 -0
package/dist/relay-headers.js +44 -0
package/dist/reranker.js +442 -0
package/dist/retype-setscope.js +348 -0
package/dist/semantic-dedup.js +75 -0
package/dist/subgraph-search.js +289 -0
package/dist/subgraph-store.js +694 -0
package/dist/tool-gating.js +58 -0
package/download-ux.ts +91 -0
package/embedding.ts +32 -9
package/fs-helpers.ts +124 -0
package/gateway-url.ts +57 -9
package/index.ts +586 -357
package/llm-client.ts +211 -23
package/lsh.ts +7 -2
package/onboarding-cli.ts +114 -1
package/package.json +19 -5
package/pair-cli.ts +76 -8
package/pair-crypto.ts +34 -24
package/pair-page.ts +28 -17
package/pair-qr.ts +152 -0
package/pair-remote-client.ts +540 -0
package/qa-bug-report.ts +381 -0
package/relay-headers.ts +50 -0
package/reranker.ts +73 -0
package/retype-setscope.ts +12 -0
package/subgraph-search.ts +4 -3
package/subgraph-store.ts +109 -16

package/llm-client.ts CHANGED Viewed

@@ -72,8 +72,48 @@ const PROVIDER_KEY_NAMES: Record<string, string[]> = {
   cerebras:   ['cerebras'],
 };
+/**
+ * zai has TWO public endpoints. The CODING endpoint is what GLM Coding Plan
+ * subscription keys are provisioned against; the STANDARD (PAYG) endpoint
+ * serves pay-as-you-go balances. A coding-plan key that hits the STANDARD
+ * endpoint returns HTTP 429 with body `"Insufficient balance or no resource
+ * package. Please recharge."` — misleading because the subscription is in
+ * good standing. Vice-versa for PAYG keys that accidentally hit CODING.
+ *
+ * 3.3.1-rc.3: exported so the rc.3 auto-fallback (see `chatCompletion`)
+ * can flip between them when the upstream error signature matches.
+ */
+export const ZAI_CODING_BASE_URL = 'https://api.z.ai/api/coding/paas/v4';
+export const ZAI_STANDARD_BASE_URL = 'https://api.z.ai/api/paas/v4';
+/**
+ * Resolve the zai base URL.
+ *
+ * Precedence:
+ *   1. `ZAI_BASE_URL` env var (explicit operator override — read by
+ *      `CONFIG.zaiBaseUrl` via a getter so tests can mutate the env
+ *      between calls)
+ *   2. Default: coding endpoint (coding-plan-biased; the rc.3 auto-fallback
+ *      hops to the standard endpoint on an "Insufficient balance" 429).
+ *
+ * Documented in plugin SKILL.md — Coding-Plan users can leave it unset (or
+ * set it explicitly to `https://api.z.ai/api/coding/paas/v4`). PAYG users
+ * MUST set it to `https://api.z.ai/api/paas/v4` to avoid the auto-fallback
+ * tax on every first call.
+ *
+ * Scanner-isolation note: the env read lives in `config.ts` (which has no
+ * network triggers). This module has network calls, so it cannot touch
+ * env vars directly — both rules 1 (env-harvesting) and 2 (potential-
+ * exfiltration) in check-scanner.mjs would fire.
+ */
+export function getZaiBaseUrl(): string {
+  return CONFIG.zaiBaseUrl;
+}
 const PROVIDER_BASE_URLS: Record<string, string> = {
-  zai:        'https://api.z.ai/api/coding/paas/v4',
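+  // zai: this entry is a snapshot taken once, when this object literal is
+  // evaluated — it does NOT track later `ZAI_BASE_URL` env changes. Call
+  // sites that need the current value call `getZaiBaseUrl()` directly
+  // (see `buildConfigForProvider`).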
+  zai:        getZaiBaseUrl(),
   anthropic:  'https://api.anthropic.com/v1',
   openai:     'https://api.openai.com/v1',
   gemini:     'https://generativelanguage.googleapis.com/v1beta/openai',
@@ -196,7 +236,13 @@ function buildConfigForProvider(
     apiFormatOverride?: 'openai' | 'anthropic';
   } = {},
 ): LLMClientConfig | null {
-  const baseUrl = (opts.baseUrlOverride ?? PROVIDER_BASE_URLS[provider] ?? '').replace(/\/+$/, '');
+  // zai's base URL is resolved via `getZaiBaseUrl()` (reads CONFIG) so
+  // the `ZAI_BASE_URL` env override takes effect even when this helper is
+  // called with no `baseUrlOverride` (i.e. the env-var fallback tier in
+  // initLLMClient).
+  const defaultForProvider =
+    provider === 'zai' ? getZaiBaseUrl() : PROVIDER_BASE_URLS[provider] ?? '';
+  const baseUrl = (opts.baseUrlOverride ?? defaultForProvider).replace(/\/+$/, '');
   if (!baseUrl) return null;
   const model =
     opts.modelOverride ??
@@ -466,7 +512,7 @@ export function resolveLLMConfig(): LLMClientConfig | null {
   if (zaiKey) {
     return {
       apiKey: zaiKey,
-      baseUrl: 'https://api.z.ai/api/coding/paas/v4',
+      baseUrl: getZaiBaseUrl(),
       model,
       apiFormat: 'openai',
     };
@@ -486,22 +532,29 @@ export function resolveLLMConfig(): LLMClientConfig | null {
 /**
  * Options for chatCompletion. `retry` controls the 429 + timeout backoff
- * loop added in 3.3.1-rc.2 — 5 of 6 extraction windows failed in the
- * 3.3.1-rc.1 QA because zai 429s had no retry path.
+ * loop. Defaults to 5 attempts with 2s → 4s → 8s → 16s waits between them
+ * (~30s of cumulative backoff — the nominal next step, 32s, is never
+ * reached because the fifth attempt is final) — rc.1/rc.2 QA showed
+ * multi-minute upstream outages that blew through the rc.2 7s budget.
+ * Configurable via `TOTALRECLAW_LLM_RETRY_BUDGET_MS` env (cap on
+ * cumulative retry-delay).
  */
 export interface ChatCompletionOptions {
   maxTokens?: number;
   temperature?: number;
   /**
-   * Retry behaviour. Defaults to { attempts: 3, baseDelayMs: 1000 } —
-   * 1s → 2s → 4s exponential backoff on 429 or transient timeout. First
-   * failure logs at INFO (single-line, no stack), subsequent attempts at
-   * DEBUG. Set `attempts: 0` to disable retry entirely. Pass a `logger`
-   * for visibility; without one, retries are silent.
+   * Retry behaviour. Defaults mirror the rc.3 budget: 5 attempts, 2s base
+   * delay, exponential. Set `attempts: 0` (or `1`) to disable retry. Pass
+   * a `logger` for visibility; without one, retries are silent.
+   *
+   * `budgetMs` caps the cumulative retry-delay time — after an attempt
+   * fails, we compute the next delay and skip it (falling through to the
+   * give-up path) if adding it would exceed the budget. Defaults to the
+   * value read from `TOTALRECLAW_LLM_RETRY_BUDGET_MS` at module load,
+   * which itself defaults to 60_000ms.
    */
   retry?: {
     attempts?: number;
     baseDelayMs?: number;
+    budgetMs?: number;
   };
   logger?: {
     info?: (msg: string) => void;
@@ -512,17 +565,76 @@ export interface ChatCompletionOptions {
   timeoutMs?: number;
 }
+/**
+ * Default retry budget in ms. Configurable via
+ * `TOTALRECLAW_LLM_RETRY_BUDGET_MS` env var — read by `config.ts`. Callers
+ * can override per-call via `retry.budgetMs`. The budget caps cumulative
+ * backoff delay only; with the default schedule (5 attempts, 2s base,
+ * doubling) the waits are 2s + 4s + 8s + 16s = 30s, which fits inside a
+ * 60_000ms budget.
+ *
+ * Scanner-isolation note: the env read lives in `config.ts` so this file
+ * stays clean of env-harvesting triggers.
+ */
+export const DEFAULT_RETRY_BUDGET_MS: number = CONFIG.llmRetryBudgetMs;
+/**
+ * Structured error thrown when the extraction LLM upstream is unreachable
+ * after the full retry budget is exhausted. The extraction pipeline
+ * recognizes this via `err instanceof LLMUpstreamOutageError` and can
+ * choose to:
+ *   - queue the message batch for retry next turn,
+ *   - surface a one-time notification to the user, or
+ *   - simply skip this extraction window silently.
+ */
+export class LLMUpstreamOutageError extends Error {
+  readonly attempts: number;
+  readonly lastStatus?: number;
+  constructor(message: string, attempts: number, lastStatus?: number) {
+    super(message);
+    this.name = 'LLMUpstreamOutageError';
+    this.attempts = attempts;
+    this.lastStatus = lastStatus;
+  }
+}
+/**
+ * Detect the "Insufficient balance" error shape from zai. Matches both
+ * the exact production wording ("Insufficient balance or no resource
+ * package. Please recharge.") and the short "no resource package" variant
+ * we've seen in some historical responses.
+ */
+export function isZaiBalanceError(errorMessage: string): boolean {
+  const m = errorMessage.toLowerCase();
+  return m.includes('insufficient balance') || m.includes('no resource package');
+}
+/**
+ * Identify the "other" zai endpoint when the current one returns a balance
+ * error — CODING ↔ STANDARD. Returns `null` when the URL is neither of
+ * the two zai endpoints we know about (e.g. a self-hosted proxy), which
+ * means the fallback logic stays put.
+ */
+export function zaiFallbackBaseUrl(currentBaseUrl: string): string | null {
+  const normalized = currentBaseUrl.replace(/\/+$/, '');
+  if (normalized === ZAI_CODING_BASE_URL) return ZAI_STANDARD_BASE_URL;
+  if (normalized === ZAI_STANDARD_BASE_URL) return ZAI_CODING_BASE_URL;
+  return null;
+}
 /**
  * Call the LLM chat completion endpoint.
  *
  * Supports both OpenAI-compatible format and Anthropic Messages API,
  * determined by `config.apiFormat`.
  *
- * 3.3.1-rc.2 — adds an exponential-backoff retry wrapper for HTTP 429 +
- * timeout transients. Every retry attempt respects the per-attempt
- * `timeoutMs` (default 30s). Max 3 total attempts by default (1s, 2s, 4s
- * backoff). Non-retryable errors (4xx other than 429, network refused,
- * JSON parse) fail fast on the first attempt.
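+ * 3.3.1-rc.3 — lifts the retry schedule to 5 attempts with 2s/4s/8s/16s
+ * waits between them (~30s of cumulative backoff; no wait follows the
+ * final attempt). The cumulative-delay cap is configurable via
+ * `TOTALRECLAW_LLM_RETRY_BUDGET_MS`. Adds zai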
+ * "Insufficient balance" auto-fallback: when a zai 429 carries the balance
+ * error body AND we're on one of the two known zai endpoints, we flip to
+ * the OTHER endpoint and retry ONCE (accounted for separately from the
+ * normal retry loop). On exhaustion, throws `LLMUpstreamOutageError`.
+ *
+ * Non-retryable errors (4xx other than 429, network refused, JSON parse)
+ * fail fast on the first attempt.
  *
  * @returns The assistant's response content, or null on failure.
  */
@@ -533,34 +645,96 @@ export async function chatCompletion(
 ): Promise<string | null> {
   const maxTokens = options?.maxTokens ?? 2048;
   const temperature = options?.temperature ?? 0; // Deterministic output for dedup (same input → same text → same content fingerprint)
-  const attempts = Math.max(1, options?.retry?.attempts ?? 3);
-  const baseDelayMs = Math.max(100, options?.retry?.baseDelayMs ?? 1000);
+  const attempts = Math.max(1, options?.retry?.attempts ?? 5);
+  const baseDelayMs = Math.max(100, options?.retry?.baseDelayMs ?? 2000);
+  const budgetMs = Math.max(100, options?.retry?.budgetMs ?? DEFAULT_RETRY_BUDGET_MS);
   const timeoutMs = options?.timeoutMs ?? 30_000;
   const logger = options?.logger;
+  // We mutate `activeConfig.baseUrl` in the zai fallback branch so the
+  // retried call hits the other endpoint. Shallow-clone so the caller's
+  // config object stays untouched.
+  const activeConfig: LLMClientConfig = { ...config };
+  // One-shot flag: we only auto-fallback zai once per chatCompletion call
+  // to prevent ping-pong between the two endpoints if both reject.
+  let zaiFallbackAttempted = false;
   const callOnce = (): Promise<string | null> =>
-    config.apiFormat === 'anthropic'
-      ? chatCompletionAnthropic(config, messages, maxTokens, temperature, timeoutMs)
-      : chatCompletionOpenAI(config, messages, maxTokens, temperature, timeoutMs);
+    activeConfig.apiFormat === 'anthropic'
+      ? chatCompletionAnthropic(activeConfig, messages, maxTokens, temperature, timeoutMs)
+      : chatCompletionOpenAI(activeConfig, messages, maxTokens, temperature, timeoutMs);
   let lastErr: unknown;
+  let cumulativeDelayMs = 0;
+  let lastStatus: number | undefined;
   for (let attempt = 1; attempt <= attempts; attempt++) {
     try {
       return await callOnce();
     } catch (err) {
       lastErr = err;
       const msg = err instanceof Error ? err.message : String(err);
+      lastStatus = parseHttpStatus(msg) ?? lastStatus;
+      // ── zai "Insufficient balance" auto-fallback ──
+      // Fires BEFORE the normal retry accounting. If the error is a zai
+      // balance-shaped 429, flip the baseUrl once and immediately retry —
+      // no backoff, no decrement of the attempt count. Keeps the total
+      // attempt budget reserved for genuine outages.
+      if (!zaiFallbackAttempted && /\b429\b/.test(msg) && isZaiBalanceError(msg)) {
+        const fallback = zaiFallbackBaseUrl(activeConfig.baseUrl);
+        if (fallback) {
+          zaiFallbackAttempted = true;
+          const oldUrl = activeConfig.baseUrl;
+          activeConfig.baseUrl = fallback;
+          logger?.info?.(
+            `chatCompletion: zai endpoint auto-fallback: ${oldUrl} → ${fallback} due to "Insufficient balance" response`,
+          );
+          // Retry immediately. `attempt--` cancels out the loop's
+          // `attempt++`, so this fallback call is a freebie that does not
+          // consume one of the `attempts`.
+          attempt--;
+          continue;
+        }
+      }
       const retryable = isRetryable(msg);
       const isFinalAttempt = attempt >= attempts;
       if (!retryable || isFinalAttempt) {
         // Fail-fast OR last attempt — rethrow.
-        if (attempt > 1) {
-          logger?.warn?.(`chatCompletion: giving up after ${attempt} attempts: ${msg.slice(0, 200)}`);
+        if (attempt > 1 || !retryable) {
+          if (retryable) {
+            logger?.warn?.(`chatCompletion: giving up after ${attempt} attempts: ${msg.slice(0, 200)}`);
+          }
+          // Structured outage error when the retryable error budget is
+          // fully exhausted — lets downstream recognize vs bail silently.
+          if (retryable) {
+            throw new LLMUpstreamOutageError(
+              `LLM upstream outage after ${attempt} attempts: ${msg.slice(0, 200)}`,
+              attempt,
+              lastStatus,
+            );
+          }
         }
         throw err;
       }
-      // Retry. INFO on first failure (visible), DEBUG on subsequent.
+      // Compute next delay, but respect the cumulative retry-budget cap.
       const delayMs = baseDelayMs * Math.pow(2, attempt - 1);
+      if (cumulativeDelayMs + delayMs > budgetMs) {
+        logger?.warn?.(
+          `chatCompletion: retry budget exhausted (${cumulativeDelayMs}ms used + ${delayMs}ms next > ${budgetMs}ms budget); surfacing outage after ${attempt} attempts: ${msg.slice(0, 160)}`,
+        );
+        throw new LLMUpstreamOutageError(
+          `LLM upstream outage (budget ${budgetMs}ms exhausted after ${attempt} attempts): ${msg.slice(0, 200)}`,
+          attempt,
+          lastStatus,
+        );
+      }
+      cumulativeDelayMs += delayMs;
+      // Log only the FIRST retry at INFO to avoid spamming during long
+      // outages; subsequent retries are DEBUG (debounced per outage).
       if (attempt === 1) {
         logger?.info?.(
           `chatCompletion: retrying after transient failure (attempt ${attempt}/${attempts}, wait ${delayMs}ms): ${msg.slice(0, 160)}`,
@@ -578,6 +752,20 @@ export async function chatCompletion(
   throw lastErr instanceof Error ? lastErr : new Error(String(lastErr));
 }
+/**
+ * Parse the HTTP status code from an error message of the form
+ * `"LLM API 429: rate limit"` or `"Anthropic API 503: ..."`. Returns
+ * `undefined` when the message contains no standalone three-digit token
+ * in the 100–599 range. Used by `LLMUpstreamOutageError.lastStatus` for
+ * downstream classification.
+ *
+ * NOTE(review): the pattern is not anchored to the `API <code>:` shape — it
+ * takes the FIRST standalone three-digit token anywhere in the message and
+ * only range-checks that one. A message whose first such token is something
+ * else (e.g. the `127` in `127.0.0.1`, or the `300` in `300 ms`) would be
+ * reported as a status, so a network-refused error is not guaranteed to
+ * yield `undefined`. Consider anchoring on `API (\d{3})`.
+ */
+function parseHttpStatus(errorMessage: string): number | undefined {
+  const m = errorMessage.match(/\b(\d{3})\b/);
+  if (!m) return undefined;
+  const code = parseInt(m[1], 10);
+  return code >= 100 && code < 600 ? code : undefined;
+}
 /**
  * Which LLM-call errors are worth retrying. Exported for testability.
  *

package/lsh.ts CHANGED Viewed

@@ -7,10 +7,15 @@
  * Default parameters: 32 bits per table, 20 tables.
  */
-// Lazy-load WASM to avoid crash when npm install hasn't finished yet.
+// Lazy-load WASM via createRequire. The shipped `dist/index.js` is ESM-only
+// (`"type":"module"`) so the bare `require` global is undefined at runtime.
+// See issue #124 for the bug this avoids; matches the pattern in
+// claims-helper / consolidation / digest-sync / pin / retype-setscope.
+import { createRequire } from 'node:module';
+const requireWasm = createRequire(import.meta.url);
 let _WasmLshHasher: typeof import('@totalreclaw/core')['WasmLshHasher'] | null = null;
 function getWasmLshHasher() {
-  if (!_WasmLshHasher) _WasmLshHasher = require('@totalreclaw/core').WasmLshHasher;
+  if (!_WasmLshHasher) _WasmLshHasher = requireWasm('@totalreclaw/core').WasmLshHasher;
   return _WasmLshHasher!;
 }

package/onboarding-cli.ts CHANGED Viewed

@@ -59,6 +59,23 @@ import {
 // has one place to grow into later).
 // ---------------------------------------------------------------------------
+/**
+ * 3.3.1-rc.18 (issue #95) — deprecation warning for the interactive
+ * phrase-print branch. Emitted to STDERR (never stdout) so it is visible
+ * to humans but does not pollute any pipe consuming the wizard's output.
+ *
+ * The phrase-print branch will be REMOVED in the next RC after rc.18.
+ * Users running on a TTY can still complete the flow in rc.18; agents
+ * MUST use `--pair-only` or the `totalreclaw_pair` tool today.
+ */
+export const PHRASE_PRINT_DEPRECATION_WARNING =
+  '\nDEPRECATION (issue #95): the interactive `openclaw totalreclaw onboard` flow\n' +
+  '  prints your recovery phrase to this terminal. This is being removed in the\n' +
+  '  next release candidate. For agent / scripted invocation, use:\n' +
+  '    openclaw totalreclaw onboard --pair-only\n' +
+  '  which emits ONLY {pair_url, pin} JSON and routes the phrase through the\n' +
+  '  browser flow (never on stdout).\n\n';
 export const COPY = {
   welcome:
     '\nTotalReclaw — Secure onboarding\n\n' +
@@ -403,6 +420,11 @@ export async function runOnboardingWizard(deps: WizardDeps): Promise<WizardResul
   }
   if (choice === 'generate') {
+    // 3.3.1-rc.18 (issue #95) — deprecation banner on stderr ONLY.
+    // The phrase-print branch is scheduled for removal in the RC after
+    // rc.18; we keep it functional in rc.18 for back-compat with users
+    // running the wizard on a real TTY today.
+    io.stderr.write(PHRASE_PRINT_DEPRECATION_WARNING);
     io.stdout.write(COPY.generateWarning);
     io.stdout.write(COPY.importRemoteLimitation);
     const mnemonic = genMnemonic();
@@ -674,6 +696,22 @@ export async function runNonInteractiveOnboard(
  *   --emit-phrase          Include the plaintext phrase in the JSON payload
  *                          (NOT recommended — the phrase lives in
  *                          credentials.json; prefer reading it there).
+ *
+ * 3.3.1-rc.18 — `onboard` accepts:
+ *   --pair-only            Phrase-safe agent-shell flag (issue #95).
+ *                          Delegates to the pair flow and emits a single
+ *                          line of JSON `{v, pair_url, pin, expires_at_ms}`
+ *                          to stdout. Phrase NEVER touches stdout, stderr,
+ *                          or the logger in this mode. Use this for any
+ *                          agent-driven setup; it is the recommended path
+ *                          when a container-based agent does not have the
+ *                          `totalreclaw_pair` tool injected.
+ *
+ *                          Requires `pairSessionsPath` + `renderPairingUrl`
+ *                          to be supplied to `registerOnboardingCli`. If
+ *                          absent, `--pair-only` exits non-zero with a
+ *                          clear message instead of falling through to the
+ *                          phrase-print branch.
  */
 export function registerOnboardingCli(
   program: import('commander').Command,
@@ -683,6 +721,10 @@ export function registerOnboardingCli(
     logger: { info(msg: string): void; warn(msg: string): void; error(msg: string): void };
     /** Caller-supplied helper for scope-address derivation. Optional — when absent, JSON output omits `scope_address`. */
     deriveScopeAddress?: (mnemonic: string) => Promise<string | undefined>;
+    /** Caller-supplied path to the pair-session store. Required for `--pair-only`. */
+    pairSessionsPath?: string;
+    /** Caller-supplied URL renderer for the pair flow. Required for `--pair-only`. */
+    renderPairingUrl?: (session: import('./pair-session-store.js').PairSession) => string;
   },
 ): void {
   const tr = program
@@ -690,12 +732,13 @@ export function registerOnboardingCli(
     .description('TotalReclaw encrypted memory — secure onboarding + status');
   tr.command('onboard')
-    .description('Interactive onboarding: generate or import a recovery phrase (runs locally, no LLM)')
+    .description('Interactive onboarding: generate or import a recovery phrase (runs locally, no LLM). For agent-driven setup prefer --pair-only.')
     .option('--non-interactive', 'Exit non-zero if any input would be prompted for (agent-driven use)')
     .option('--json', 'Emit the result as a structured JSON payload. Only valid with --non-interactive.')
     .option('--mode <mode>', 'generate | restore — skip the menu prompt')
     .option('--phrase <phrase>', 'Recovery phrase for --mode restore. `-` reads from stdin.')
     .option('--emit-phrase', 'Include the plaintext phrase in the JSON payload (not recommended). Default: false.')
+    .option('--pair-only', 'Phrase-safe agent-invocation mode (issue #95). Emits ONLY {v,pair_url,pin,expires_at_ms} JSON to stdout via the pair flow. Phrase never touches stdout/stderr/logger. RECOMMENDED for any agent or scripted invocation.')
     .action(async (...actionArgs: unknown[]) => {
       // commander: (options, cmd)
       const cliOpts = (actionArgs[0] ?? {}) as {
@@ -704,8 +747,70 @@ export function registerOnboardingCli(
         mode?: string;
         phrase?: string;
         emitPhrase?: boolean;
+        pairOnly?: boolean;
       };
+      // ---------------------------------------------------------------
+      // 3.3.1-rc.18 — `--pair-only` (issue #95)
+      //
+      // Phrase-safe agent-shell flag. Delegates to the pair flow and
+      // emits a single line of JSON `{v, pair_url, pin, expires_at_ms}`
+      // to stdout. By construction:
+      //   - The pair flow is x25519-only — pair-crypto.ts does NOT
+      //     import @scure/bip39 and never touches a recovery phrase.
+      //   - No interactive prompts, no readline, no @scure/bip39 import
+      //     in this code path. Phrase never enters stdout/stderr/logger.
+      //   - Stays silent on status transitions (the runPairCli
+      //     `pair-only` output mode suppresses banners, spinners, and
+      //     all human-readable copy).
+      //
+      // This MUST be the path agents take when they need to set up
+      // TotalReclaw via a shell. The interactive phrase-print branch
+      // below is deprecated for that use case and emits a warning when
+      // the user falls through to it.
+      // ---------------------------------------------------------------
+      if (cliOpts.pairOnly) {
+        if (!opts.pairSessionsPath || !opts.renderPairingUrl) {
+          process.stderr.write(
+            '--pair-only is unavailable: this OpenClaw build did not wire the pair flow into the onboard CLI. ' +
+              'Use `openclaw totalreclaw pair generate --url-pin-only` instead.\n',
+          );
+          process.exit(1);
+        }
+        // Resolve mode. `--mode restore` (or `import`) maps to the pair
+        // flow's 'import' mode, which runs in the browser rather than in
+        // the CLI; any other value (or none) silently defaults to
+        // 'generate'.
+        const pairMode = cliOpts.mode === 'restore' || cliOpts.mode === 'import' ? 'import' : 'generate';
+        // Lazy import — keeps pair-cli + qrcode-terminal off the
+        // onboarding hot path when --pair-only is not used.
+        const { runPairCli, defaultRenderQr, buildDefaultPairCliIo } = await import('./pair-cli.js');
+        const io = buildDefaultPairCliIo();
+        try {
+          const outcome = await runPairCli(pairMode, {
+            sessionsPath: opts.pairSessionsPath,
+            renderPairingUrl: opts.renderPairingUrl,
+            renderQr: defaultRenderQr,
+            io,
+            outputMode: 'pair-only',
+          });
+          if (outcome.status !== 'completed') {
+            process.exit(outcome.status === 'canceled' ? 130 : 1);
+          }
+          process.exit(0);
+        } catch (err) {
+          // CRITICAL: this catch MUST NOT include the phrase, the
+          // mnemonic, or any user secret in the message. The pair flow
+          // does not produce phrase material, so this is structurally
+          // safe — but defense-in-depth: stderr gets a fixed error
+          // string; only the logger receives `err.message`.
+          opts.logger.error(
+            `pair-only delegation crashed: ${err instanceof Error ? err.message : String(err)}`,
+          );
+          process.stderr.write('--pair-only failed (see logs).\n');
+          process.exit(2);
+        }
+      }
       if (cliOpts.nonInteractive) {
         // Non-interactive path — no readline, no prompts.
         const mode: 'generate' | 'restore' | null =
@@ -744,10 +849,18 @@ export function registerOnboardingCli(
         });
         if (cliOpts.json) {
+          // 3.3.1-rc.18 (issue #95) — emit deprecation on stderr when
+          // the JSON payload is about to include the plaintext phrase.
+          // stderr is intentional: stdout must remain a single
+          // machine-parseable JSON line.
+          if (cliOpts.emitPhrase && result.ok && result.mnemonic) {
+            process.stderr.write(PHRASE_PRINT_DEPRECATION_WARNING);
+          }
           process.stdout.write(JSON.stringify(result) + '\n');
         } else {
           if (result.ok) {
             if (result.mnemonic) {
+              process.stderr.write(PHRASE_PRINT_DEPRECATION_WARNING);
               process.stderr.write(
                 'WARNING: --emit-phrase was set. The plaintext recovery phrase was returned.\n' +
                   'For agent-driven flows, prefer reading ~/.totalreclaw/credentials.json directly ' +

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@totalreclaw/totalreclaw",
-  "version": "3.3.1-rc.2",
+  "version": "3.3.1-rc.21",
   "description": "End-to-end encrypted, agent-portable memory for OpenClaw and any LLM-agent runtime. XChaCha20-Poly1305 with protobuf v4 + on-chain Memory Taxonomy v1 (claim / preference / directive / commitment / episode / summary).",
   "type": "module",
   "keywords": [
@@ -31,13 +31,23 @@
   "author": "TotalReclaw Team",
   "license": "MIT",
   "dependencies": {
+    "@huggingface/transformers": "^4.0.1",
     "@totalreclaw/client": "^1.2.0",
     "@totalreclaw/core": "^2.1.1",
-    "@huggingface/transformers": "^4.0.1",
+    "@types/qrcode": "^1.5.6",
+    "@types/ws": "^8.5.12",
     "onnxruntime-node": "^1.24.0",
-    "qrcode-terminal": "^0.12.0"
+    "qrcode": "^1.5.4",
+    "qrcode-terminal": "^0.12.0",
+    "ws": "^8.18.3"
+  },
+  "devDependencies": {
+    "typescript": "^5.5.0"
   },
+  "main": "./dist/index.js",
+  "types": "./dist/index.d.ts",
   "files": [
+    "dist/",
     "*.ts",
     "import-adapters/",
     "!**/*.test.ts",
@@ -50,13 +60,17 @@
     "skill.json"
   ],
   "scripts": {
-    "test": "npx tsx manifest-shape.test.ts && npx tsx config-schema.test.ts && npx tsx llm-profile-reader.test.ts && npx tsx llm-client.test.ts && npx tsx llm-client-retry.test.ts && npx tsx gateway-url.test.ts && npx tsx retype-setscope.test.ts && npx tsx tool-gating.test.ts && npx tsx onboarding-noninteractive.test.ts && npx tsx pair-cli-json.test.ts",
+    "build": "rm -rf dist && tsc -p tsconfig.json --noCheck",
+    "verify-tarball": "node ../scripts/verify-tarball.mjs",
+    "test": "npx tsx manifest-shape.test.ts && npx tsx config-schema.test.ts && npx tsx config.test.ts && npx tsx relay-headers.test.ts && npx tsx scope-address-visible.test.ts && npx tsx llm-profile-reader.test.ts && npx tsx llm-client.test.ts && npx tsx llm-client-retry.test.ts && npx tsx gateway-url.test.ts && npx tsx retype-setscope.test.ts && npx tsx tool-gating.test.ts && npx tsx onboarding-noninteractive.test.ts && npx tsx pair-cli-json.test.ts && npx tsx pair-qr.test.ts && npx tsx pair-remote-client.test.ts && npx tsx qa-bug-report.test.ts && npx tsx nonce-serialization.test.ts && npx tsx phrase-safety-registry.test.ts && npx tsx test_issue_92_onnx_download_ux.test.ts && npx tsx onboard-pair-only.test.ts && npx tsx import-time-smoke.test.ts && npx tsx recall-relevance-gate.test.ts && npx tsx install-staging-cleanup.test.ts && npx tsx json-stdout-cleanliness.test.ts",
+    "smoke:dist": "npx tsx dist-esm-smoke.test.ts",
     "check-scanner": "node ../scripts/check-scanner.mjs",
+    "prepack": "npm run build",
     "prepublishOnly": "node ../scripts/check-scanner.mjs"
   },
   "openclaw": {
     "extensions": [
-      "./index.ts"
+      "./dist/index.js"
     ]
   }
 }