npm - switchroom - Versions diffs - 0.8.1 → 0.11.0 - Mend

switchroom 0.8.1 → 0.11.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (137) hide show

package/README.md +54 -61
package/bin/timezone-hook.sh +9 -7
package/dist/agent-scheduler/index.js +285 -45
package/dist/auth-broker/index.js +13932 -0
package/dist/cli/drive-write-pretool.mjs +5418 -0
package/dist/cli/switchroom.js +8890 -5560
package/dist/host-control/main.js +582 -43
package/dist/vault/approvals/kernel-server.js +276 -47
package/dist/vault/broker/server.js +333 -69
package/examples/minimal.yaml +63 -0
package/examples/personal-google-workspace-mcp/.env.example +34 -0
package/examples/personal-google-workspace-mcp/README.md +194 -0
package/examples/personal-google-workspace-mcp/compose.yaml +66 -0
package/examples/switchroom.yaml +220 -0
package/package.json +6 -4
package/profiles/_base/start.sh.hbs +3 -3
package/profiles/_shared/agent-self-service.md.hbs +126 -0
package/profiles/default/CLAUDE.md +10 -0
package/profiles/default/CLAUDE.md.hbs +16 -0
package/skills/buildkite-agent-infrastructure/SKILL.md +30 -11
package/skills/buildkite-agent-runtime/SKILL.md +44 -11
package/skills/buildkite-api/SKILL.md +31 -8
package/skills/buildkite-cli/SKILL.md +27 -9
package/skills/buildkite-migration/SKILL.md +22 -9
package/skills/buildkite-pipelines/SKILL.md +26 -9
package/skills/buildkite-secure-delivery/SKILL.md +23 -9
package/skills/buildkite-test-engine/SKILL.md +25 -8
package/skills/docx/SKILL.md +1 -1
package/skills/file-bug/SKILL.md +34 -6
package/skills/humanizer/SKILL.md +15 -0
package/skills/humanizer-calibrate/SKILL.md +7 -1
package/skills/mcp-builder/SKILL.md +1 -1
package/skills/pdf/SKILL.md +1 -1
package/skills/pptx/SKILL.md +1 -1
package/skills/skill-creator/SKILL.md +21 -1
package/skills/skill-creator/scripts/__pycache__/__init__.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/generate_report.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/improve_description.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_eval.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_loop.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/utils.cpython-313.pyc +0 -0
package/skills/switchroom-cli/SKILL.md +63 -64
package/skills/switchroom-health/SKILL.md +23 -10
package/skills/switchroom-install/SKILL.md +3 -3
package/skills/switchroom-manage/SKILL.md +26 -19
package/skills/switchroom-runtime/SKILL.md +67 -15
package/skills/switchroom-status/SKILL.md +26 -1
package/skills/telegram-test-harness/SKILL.md +3 -0
package/skills/webapp-testing/SKILL.md +31 -1
package/skills/xlsx/SKILL.md +1 -1
package/telegram-plugin/admin-commands/dispatch.test.ts +1 -1
package/telegram-plugin/admin-commands/index.ts +9 -5
package/telegram-plugin/auth-snapshot-format.ts +612 -0
package/telegram-plugin/auto-fallback-fleet.ts +215 -0
package/telegram-plugin/auto-fallback.ts +28 -301
package/telegram-plugin/dist/gateway/gateway.js +17453 -15100
package/telegram-plugin/fleet-fallback-gate.ts +105 -0
package/telegram-plugin/gateway/approval-callback.test.ts +104 -0
package/telegram-plugin/gateway/approval-callback.ts +31 -3
package/telegram-plugin/gateway/auth-add-flow.ts +326 -0
package/telegram-plugin/gateway/auth-broker-client.ts +75 -0
package/telegram-plugin/gateway/auth-command.ts +905 -0
package/telegram-plugin/gateway/auth-line.ts +123 -0
package/telegram-plugin/gateway/auth-status-adapter.ts +101 -0
package/telegram-plugin/gateway/boot-card.ts +23 -37
package/telegram-plugin/gateway/boot-probes.ts +9 -12
package/telegram-plugin/gateway/diff-preview-card.test.ts +192 -0
package/telegram-plugin/gateway/diff-preview-card.ts +170 -0
package/telegram-plugin/gateway/drive-write-approval.test.ts +312 -0
package/telegram-plugin/gateway/drive-write-approval.ts +243 -0
package/telegram-plugin/gateway/folder-picker-handler.test.ts +314 -0
package/telegram-plugin/gateway/folder-picker-handler.ts +348 -0
package/telegram-plugin/gateway/gateway.ts +1156 -938
package/telegram-plugin/gateway/hostd-dispatch.ts +244 -0
package/telegram-plugin/gateway/ipc-protocol.ts +83 -2
package/telegram-plugin/gateway/ipc-server.ts +69 -0
package/telegram-plugin/hooks/sandbox-hint-posttool.mjs +103 -12
package/telegram-plugin/hooks/tool-label-pretool.mjs +11 -0
package/telegram-plugin/hooks/wedge-detect-posttool.mjs +303 -0
package/telegram-plugin/model-unavailable.ts +28 -12
package/telegram-plugin/permission-title.ts +56 -0
package/telegram-plugin/quota-check.ts +19 -41
package/telegram-plugin/scripts/build.mjs +0 -1
package/telegram-plugin/shared/bot-runtime.ts +5 -4
package/telegram-plugin/silence-poke.ts +153 -1
package/telegram-plugin/tests/auth-add-flow.test.ts +559 -0
package/telegram-plugin/tests/auth-code-redact.test.ts +8 -4
package/telegram-plugin/tests/auth-command-format2.test.ts +156 -0
package/telegram-plugin/tests/auth-command-vernacular.test.ts +531 -0
package/telegram-plugin/tests/auth-snapshot-format.test.ts +429 -0
package/telegram-plugin/tests/auth-status-adapter.test.ts +129 -0
package/telegram-plugin/tests/auto-fallback-fleet.test.ts +211 -0
package/telegram-plugin/tests/auto-fallback.test.ts +60 -358
package/telegram-plugin/tests/boot-probes.test.ts +27 -22
package/telegram-plugin/tests/fleet-fallback-gate.test.ts +197 -0
package/telegram-plugin/tests/model-unavailable.test.ts +30 -5
package/telegram-plugin/tests/permission-title.test.ts +31 -0
package/telegram-plugin/tests/quota-check.test.ts +5 -35
package/telegram-plugin/tests/sandbox-hint-posttool.test.ts +212 -2
package/telegram-plugin/tests/silence-poke.test.ts +237 -0
package/telegram-plugin/tests/turn-flush-safety.test.ts +112 -0
package/telegram-plugin/turn-flush-safety.ts +55 -1
package/telegram-plugin/uat/SETUP.md +35 -1
package/telegram-plugin/uat/runners/agent-self-sufficiency.ts +457 -0
package/telegram-plugin/uat/runners/paraphrases.ts +231 -0
package/telegram-plugin/uat/runners/report.ts +150 -0
package/telegram-plugin/uat/runners/run-agent-self-sufficiency.sh +50 -0
package/telegram-plugin/uat/runners/scorer.test.ts +196 -0
package/telegram-plugin/uat/runners/scorer.ts +106 -0
package/telegram-plugin/uat/runners/skill-coverage.test.ts +100 -0
package/telegram-plugin/uat/runners/skill-coverage.ts +620 -0
package/telegram-plugin/uat/scenarios/jtbd-interrupt-marker-dm.test.ts +7 -1
package/telegram-plugin/uat/scenarios/jtbd-rapid-followup-dm.test.ts +7 -1
package/telegram-plugin/auth-dashboard.ts +0 -1104
package/telegram-plugin/auth-slot-parser.ts +0 -497
package/telegram-plugin/auto-fallback-dispatcher.ts +0 -68
package/telegram-plugin/dist/foreman/foreman.js +0 -31358
package/telegram-plugin/foreman/foreman-create-flow.ts +0 -202
package/telegram-plugin/foreman/foreman-handlers.ts +0 -493
package/telegram-plugin/foreman/foreman.ts +0 -1165
package/telegram-plugin/foreman/setup-flow.ts +0 -345
package/telegram-plugin/foreman/setup-state.ts +0 -239
package/telegram-plugin/foreman/state.ts +0 -203
package/telegram-plugin/tests/auth-account-identity-surface.test.ts +0 -118
package/telegram-plugin/tests/auth-dashboard-edge-cases.test.ts +0 -260
package/telegram-plugin/tests/auth-dashboard-restart-flow.test.ts +0 -140
package/telegram-plugin/tests/auth-dashboard-v3b.test.ts +0 -559
package/telegram-plugin/tests/auth-dashboard.test.ts +0 -1045
package/telegram-plugin/tests/auth-slot-commands.test.ts +0 -640
package/telegram-plugin/tests/auto-fallback-dispatcher.e2e.test.ts +0 -183
package/telegram-plugin/tests/boot-card-account-quota.test.ts +0 -137
package/telegram-plugin/tests/foreman-create-flow.test.ts +0 -359
package/telegram-plugin/tests/foreman-handlers.test.ts +0 -347
package/telegram-plugin/tests/foreman-state.test.ts +0 -164
package/telegram-plugin/tests/foreman-write-ops.test.ts +0 -214
package/telegram-plugin/tests/setup-flow.test.ts +0 -510
package/telegram-plugin/tests/setup-state.test.ts +0 -146

package/telegram-plugin/fleet-fallback-gate.ts ADDED Viewed

@@ -0,0 +1,105 @@
+/**
+ * Re-entry guard + dedup window for fleet-wide auto-fallback.
+ *
+ * Lifted out of gateway.ts so the dedup state is constructable per-test
+ * (gateway.ts module state was hard to reach from vitest — every test
+ * shared the same in-flight Promise + last-fired timestamp).
+ *
+ * Contract (the "honesty contract" from PR #1317 review):
+ *
+ *   `wouldFire()` is the SYNCHRONOUS read the model-unavailable card
+ *   uses to decide whether to advertise "Auto-failover in progress".
+ *   It MUST agree with the dispatcher's actual behavior — otherwise
+ *   the card lies (claims a swap is coming when the dispatcher will
+ *   dedup-drop or bail).
+ *
+ *   Three reasons `wouldFire()` returns false:
+ *     1. A swap is already in flight (collapse concurrent fires).
+ *     2. The post-trigger dedup window is still active (the user
+ *        already saw a swap announcement; another one would oscillate).
+ *     3. The broker is unreachable — the dispatcher would just bail
+ *        with `reason=no-broker-client`, leaving the card to lie.
+ *        Optional: only checked when `brokerReachable` is supplied.
+ *
+ *   The dedup window is armed ONLY when the action passed to `fire()`
+ *   resolves `true` (an actual swap, kind: 'switched'). No-ops (no
+ *   broker, no eligible target, idempotent skip) resolve `false` and
+ *   DO NOT arm the suppression window — otherwise a transient hiccup
+ *   blocks the next `dedupMs` of legitimate fires.
+ */
+/**
+ * Construction-time options for {@link createFleetFallbackGate}.
+ */
+export interface FleetFallbackGateOptions {
+  /**
+   * Suppression window in ms after a successful swap. While fewer than
+   * `dedupMs` ms have elapsed since the last armed fire, `wouldFire()`
+   * returns false and `fire()` resolves without running its action.
+   */
+  dedupMs: number;
+  /** Time source (overridable in tests). Defaults to `Date.now()`. */
+  nowFn?: () => number;
+  /**
+   * Synchronous probe of broker reachability. Optional. Returning false
+   * makes `wouldFire()` return false so the card stays honest about a
+   * fire that would otherwise bail in the dispatcher.
+   *
+   * Synchronous on purpose: `wouldFire()` runs on the card-render path
+   * and must not block. A connection-cached flag (e.g. a UDS reachability
+   * check populated by a background heartbeat) fits this shape.
+   *
+   * When omitted, reachability is not checked at all.
+   */
+  brokerReachable?: () => boolean;
+}
+/**
+ * Handle returned by {@link createFleetFallbackGate}. Each handle owns
+ * its own in-flight slot and last-fired timestamp.
+ */
+export interface FleetFallbackGate {
+  /** True iff a fresh fire would actually invoke the dispatcher. */
+  wouldFire(): boolean;
+  /** Run a fire-and-forget action under the gate. Collapses concurrent
+   *  callers to the same in-flight Promise. The action's resolved value
+   *  controls whether the dedup window arms (true = arm, false = skip).
+   *  Resolves immediately without running the action while the dedup
+   *  window is active or the broker probe reports unreachable.
+   *  Errors thrown by the action are swallowed: they are handed to
+   *  `onError` when it is supplied and silently dropped otherwise. */
+  fire(action: () => Promise<boolean>, onError?: (err: unknown) => void): Promise<void>;
+  /** Test seam — reset to fresh state. Production code should not call this. */
+  reset(): void;
+  /** Test/debug — current internal state. `lastFiredAtMs` is `-Infinity`
+   *  until a fire has armed the dedup window. */
+  inspect(): { inFlight: boolean; lastFiredAtMs: number };
+}
+/**
+ * Build an independent gate instance (own in-flight slot, own dedup
+ * timestamp) so each test — or each gateway — gets isolated state.
+ *
+ * @param opts Dedup window, optional clock and optional broker probe.
+ * @returns The gate handle; see {@link FleetFallbackGate}.
+ */
+export function createFleetFallbackGate(opts: FleetFallbackGateOptions): FleetFallbackGate {
+  const nowFn = opts.nowFn ?? (() => Date.now());
+  let inFlight: Promise<void> | null = null;
+  // -Infinity = never fired. Concrete number = wall-clock ms of the
+  // last actual swap. Sentinel matters in tests (fake clocks at t=0
+  // would otherwise look like "just fired" and falsely arm dedup).
+  let lastFiredAtMs = Number.NEGATIVE_INFINITY;
+  function wouldFire(): boolean {
+    if (inFlight) return false;
+    if (nowFn() - lastFiredAtMs < opts.dedupMs) return false;
+    if (opts.brokerReachable && !opts.brokerReachable()) return false;
+    return true;
+  }
+  function fire(action: () => Promise<boolean>, onError?: (err: unknown) => void): Promise<void> {
+    // Concurrent callers share the run that is already under way.
+    if (inFlight) return inFlight;
+    // Reuse the exact predicate the card reads, so what the card
+    // advertises and what the dispatcher does cannot drift apart.
+    if (!wouldFire()) return Promise.resolve();
+    let settled = false;
+    const run = (async () => {
+      try {
+        const didSwap = await action();
+        if (didSwap) lastFiredAtMs = nowFn();
+      } catch (err) {
+        if (onError) onError(err);
+      } finally {
+        settled = true;
+        inFlight = null;
+      }
+    })();
+    // If `action` throws synchronously (a non-async function typed as
+    // returning a Promise), the `finally` above has already run by the
+    // time we get here. Storing `run` then would park a settled promise
+    // in the slot forever and wedge the gate, so only publish the run
+    // while it is genuinely still pending.
+    if (!settled) inFlight = run;
+    return run;
+  }
+  return {
+    wouldFire,
+    fire,
+    reset() {
+      inFlight = null;
+      lastFiredAtMs = Number.NEGATIVE_INFINITY;
+    },
+    inspect() {
+      return { inFlight: inFlight !== null, lastFiredAtMs };
+    },
+  };
+}

package/telegram-plugin/gateway/approval-callback.test.ts ADDED Viewed

@@ -0,0 +1,104 @@
+/**
+ * Tests for `buildGrantedKeyboard` — the post-tap inline-keyboard
+ * surfaced on a granted approval card (RFC E §4.3 — granted-card
+ * confirmations gain the [ 📖 Open in Drive ] deep-link button).
+ *
+ * Scope-driven and pure, so the test runs without mocking grammy's
+ * Context or the approval kernel. The full handler in
+ * `approval-callback.ts` glues this onto the consumed-scope payload
+ * the kernel returns; the routing decision lives entirely in this
+ * builder.
+ */
+import { describe, expect, it } from "vitest";
+import { InlineKeyboard } from "grammy";
+import { buildGrantedKeyboard } from "./approval-callback.js";
+/**
+ * Helper — pull the `[{text, url}]` rows out of a grammy InlineKeyboard
+ * so we can assert without poking into its internal shape too hard.
+ */
+function rows(kb: InlineKeyboard): Array<Array<{ text: string; url?: string }>> {
+  // Flatten each grammy button to the two fields the assertions compare.
+  const grid: Array<Array<{ text: string; url?: string }>> = [];
+  for (const buttonRow of kb.inline_keyboard) {
+    const cells: Array<{ text: string; url?: string }> = [];
+    for (const button of buttonRow) {
+      const cell: { text: string; url?: string } = { text: button.text };
+      // Only URL buttons carry a `url` key; leave it off for every other kind.
+      if ("url" in button) cell.url = button.url;
+      cells.push(cell);
+    }
+    grid.push(cells);
+  }
+  return grid;
+}
+describe("buildGrantedKeyboard — Drive scopes", () => {
+  // Every case in this suite expects exactly one row holding exactly one
+  // URL button; only the scope and the target URL vary.
+  function expectOpenInDrive(scope: string, url: string): void {
+    const kb = buildGrantedKeyboard(scope);
+    expect(kb).toBeDefined();
+    expect(rows(kb!)).toEqual([[{ text: "📖 Open in Drive", url }]]);
+  }
+  it("emits Open-in-Drive for a single-doc grant", () => {
+    expectOpenInDrive("doc:gdrive:D1", "https://drive.google.com/file/d/D1/view");
+  });
+  it("emits Open-in-Drive for a folder grant (canonical folder URL)", () => {
+    expectOpenInDrive("doc:gdrive:folder/F1/**", "https://drive.google.com/drive/folders/F1");
+  });
+  it("emits Open-in-Drive for write-namespace grants on a single doc", () => {
+    expectOpenInDrive("doc:gdrive:write:D1", "https://drive.google.com/file/d/D1/view");
+  });
+  it("emits Open-in-Drive for suggest-namespace folder grants", () => {
+    expectOpenInDrive(
+      "doc:gdrive:suggest:folder/F1/**",
+      "https://drive.google.com/drive/folders/F1",
+    );
+  });
+});
+describe("buildGrantedKeyboard — no button cases", () => {
+  // Assert, in order, that none of the given scopes yields a keyboard.
+  const expectNoKeyboard = (scopes: readonly string[]): void => {
+    for (const scope of scopes) {
+      expect(buildGrantedKeyboard(scope)).toBeUndefined();
+    }
+  };
+  it("returns undefined for the whole-Drive grant (no specific artifact)", () => {
+    expectNoKeyboard(["doc:gdrive:**", "doc:gdrive:suggest:**", "doc:gdrive:write:**"]);
+  });
+  it("returns undefined for non-Drive scopes (secrets, system, vault)", () => {
+    expectNoKeyboard([
+      "secret:OPENAI_API_KEY",
+      "system:reconnect:gdrive",
+      "vault:read:gdrive:klanker:refresh_token",
+    ]);
+  });
+  it("returns undefined for unparseable Drive scopes (defense in depth)", () => {
+    // A folder id containing a slash slips past prefix matching but is
+    // rejected by parseDriveScope's id-charset check — the granted-card
+    // edit MUST NOT render a URL button derived from such a string.
+    expectNoKeyboard(["doc:gdrive:folder/abc/def/**", "doc:gdrive:write:abc?evil=1"]);
+  });
+});

package/telegram-plugin/gateway/approval-callback.ts CHANGED Viewed

@@ -21,13 +21,31 @@
  * approval_lookup (RFC §10) to discover the outcome and proceed.
  */
-import type { Context } from "grammy";
+import { type Context, InlineKeyboard } from "grammy";
 import { parseApprovalCallback, ttlMsFromToken } from "./approval-card.js";
 import {
   approvalConsume,
   approvalRecord,
 } from "../../src/vault/approvals/client.js";
 import type { ApprovalDecisionMode } from "../../src/vault/approvals/schema.js";
+import { scopeToOpenInDriveButton } from "../../src/drive/deep-links.js";
+/**
+ * Post-tap keyboard for a granted approval card.
+ *
+ * Currently the only possible content is a single `[ 📖 Open in Drive ]`
+ * URL button, produced when `scopeToOpenInDriveButton` recognises the
+ * granted scope as a specific Drive doc or folder (RFC E §4.3).
+ *
+ * No kernel I/O happens here — the result depends on `scope` alone —
+ * which keeps the builder unit-testable without a grammy Context.
+ *
+ * @param scope The scope string of the granted decision.
+ * @returns The one-button keyboard, or `undefined` when no deep-link
+ *   applies; the handler passes that straight through as
+ *   `reply_markup: undefined`, stripping the original action buttons.
+ */
+export function buildGrantedKeyboard(scope: string): InlineKeyboard | undefined {
+  const deepLink = scopeToOpenInDriveButton(scope);
+  return deepLink === null
+    ? undefined
+    : new InlineKeyboard().url(deepLink.text, deepLink.url);
+}
 export async function handleApprovalCallback(
   ctx: Context,
@@ -109,7 +127,10 @@ export async function handleApprovalCallback(
     return;
   }
-  // Edit the original card to its post-tap state and drop the keyboard.
+  // Edit the original card to its post-tap state. Drop the original
+  // action keyboard either way; on a successful grant for a Drive
+  // scope, surface `[ 📖 Open in Drive ]` so the user can jump
+  // straight from "agent has access" to the doc (RFC E §4.3).
   const icon = granted ? "✅" : "🚫";
   const newBody =
     `${icon} ${displayMode}` +
@@ -117,8 +138,15 @@ export async function handleApprovalCallback(
       ? ` · /approvals revoke <code>${decision_id}</code>`
       : "");
+  const postTapKeyboard = granted && consumed.scope
+    ? buildGrantedKeyboard(consumed.scope)
+    : undefined;
   try {
-    await ctx.editMessageText(newBody, { parse_mode: "HTML", reply_markup: undefined });
+    await ctx.editMessageText(newBody, {
+      parse_mode: "HTML",
+      reply_markup: postTapKeyboard,
+    });
   } catch {
     // Best-effort: card may have been edited or deleted under us.
   }

package/telegram-plugin/gateway/auth-add-flow.ts ADDED Viewed

@@ -0,0 +1,326 @@
+/**
+ * `/auth add <label>` Telegram chat flow (RFC H §4.3 add-account, §7.3).
+ *
+ * The headline use case: every account on the fleet is rate-limited,
+ * the LLM is unreachable, and the operator is on their phone. They
+ * need a deterministic — LLM-free — chat path to add a fresh Anthropic
+ * OAuth account. This module owns that flow end-to-end:
+ *
+ *   1. Operator sends `/auth add <label>`.
+ *   2. Gateway calls {@link startAccountAuthSession} → spawns
+ *      `claude setup-token` against a scratch directory under
+ *      `~/.switchroom/accounts/.in-progress/<label>-<rand>/`, captures
+ *      the OAuth authorize URL, and tucks pending state into
+ *      {@link pendingAuthAddFlows}.
+ *   3. Gateway replies to chat with the URL + paste instructions.
+ *   4. Operator opens URL, logs in, copies the browser code, pastes
+ *      into chat. Gateway's `pendingReauthFlows`-style intercept
+ *      catches the paste and calls {@link submitAccountAuthCode}.
+ *   5. Helper reads `<scratch>/.credentials.json` (the dotfile that
+ *      `claude setup-token` writes on success — pinned in
+ *      `src/auth/broker/server-add-account.test.ts`), builds the
+ *      {@link AddAccountCredentials} payload, and the gateway calls
+ *      broker `addAccount(label, credentials, replace=false)`.
+ *   6. Scratch dir is wiped on every code path — success, cancel,
+ *      paste-failure, TTL timeout, gateway shutdown.
+ *
+ * Why a separate module (vs reusing `src/auth/manager.ts`):
+ *
+ *   - `startAuthSession` writes `<agentDir>/.claude/.setup-token.session.json`
+ *     and is built around the per-agent OAuth flow. The `/auth add`
+ *     flow has no agent — the resulting credentials become a
+ *     broker-managed account that any agent can be set to. Threading
+ *     `agentDir` through it would corrupt the agent's own auth state
+ *     if the operator's add-flow collides with a normal reauth.
+ *   - The chat-flow surface is deterministic and stateless beyond
+ *     `pendingAuthAddFlows`. Reusing the full manager would inherit
+ *     legacy slot logic, tmp-dir cleanup heuristics, and stale-session
+ *     detection that doesn't apply when each `/auth add` creates a
+ *     fresh, unguessable scratch dir of its own.
+ *
+ * What we DO reuse: the pure parsing helpers — `parseSetupTokenUrl`
+ * (handles both claude.ai/oauth and claude.com/cai/oauth shapes),
+ * `extractCodeChallenge` (PKCE stale-session detection), and
+ * `readTokenFromCredentialsFile` (validates the `sk-ant-oat...` token
+ * shape). Those are label-agnostic.
+ *
+ * **Hard rule: NEVER touch the agent's claude process.** This flow runs
+ * as a deterministic chat handler in the gateway. The URL goes straight
+ * to chat via `bot.api.sendMessage`. The code paste is intercepted by
+ * the gateway, never forwarded to the agent's bridge. If every account
+ * on the fleet is rate-limited the LLM is unreachable — that's the
+ * whole point of the flow existing.
+ */
+import { spawn, type ChildProcess } from 'node:child_process'
+import { existsSync, mkdirSync, readFileSync, rmSync } from 'node:fs'
+import { homedir } from 'node:os'
+import { join } from 'node:path'
+import { randomBytes } from 'node:crypto'
+import {
+  parseSetupTokenUrl,
+  readTokenFromCredentialsFile,
+} from '../../src/auth/manager.js'
+import type {
+  AddAccountCredentials,
+  AnthropicAddAccountCredentials,
+} from '../../src/auth/broker/client.js'
+/* ── Pending-state map ────────────────────────────────────────────────── */
+/**
+ * In-flight `/auth add` flow keyed by Telegram chat id. The gateway's
+ * generic message intercept (sibling to `pendingReauthFlows`) reads
+ * this map to decide whether a sk-ant-…-shaped paste belongs to an
+ * add flow or to a reauth flow.
+ *
+ * TTL matches `REAUTH_INTERCEPT_TTL_MS` (10 minutes); the reaper sweep
+ * in gateway.ts walks both maps each minute.
+ */
+export interface PendingAuthAddFlow {
+  /** Account label the operator passed to `/auth add <label>`. */
+  label: string
+  /** Scratch directory handed to the child as `CLAUDE_CONFIG_DIR`. */
+  scratchDir: string
+  /**
+   * Handle (not just the PID) of the spawned `claude setup-token`
+   * process: the pasted code is written to its stdin, and cancel /
+   * timeout paths kill it through this handle.
+   */
+  child: ChildProcess
+  /** When the flow started — presumably epoch ms consumed by the TTL reaper; confirm in gateway.ts. */
+  startedAt: number
+}
+/** Module-level registry of pending flows; one entry per key (see above). */
+export const pendingAuthAddFlows = new Map<string, PendingAuthAddFlow>()
+/* ── Scratch dir lifecycle ────────────────────────────────────────────── */
+/**
+ * Pick a fresh scratch path under
+ * `~/.switchroom/accounts/.in-progress/<label>-<rand>/`.
+ *
+ * The leading dot keeps the dir hidden from `listAccounts(home)` in
+ * `src/auth/account-store.ts`, which enumerates accounts by scanning
+ * `~/.switchroom/accounts/`. That listing is the source of truth for
+ * broker `list-state` — a half-written add-in-progress must NOT
+ * appear there. `.in-progress/` is also outside the broker's
+ * managed-artifact whitelist, so a stray dir won't blow up on the
+ * next apply.
+ *
+ * Random suffix is 8 bytes of crypto-grade randomness so:
+ *   - two concurrent operators adding the same label can't collide
+ *     on the scratch path
+ *   - an attacker watching `~/.switchroom/accounts/.in-progress/`
+ *     can't predict the next dir name and squat a symlink
+ *
+ * The label must be a single path segment. The returned path is later
+ * removed with a recursive, forced `rmSync`, so a label containing a
+ * path separator (e.g. `../../x`) must never be allowed to steer that
+ * removal outside `.in-progress/`.
+ *
+ * @param label Operator-supplied account label.
+ * @param home Home directory to root the path in (defaults to `homedir()`).
+ * @returns The scratch directory path. Nothing is created on disk.
+ * @throws Error when `label` contains `/`, `\` or a NUL character.
+ */
+export function pickScratchDir(label: string, home: string = homedir()): string {
+  if (/[\\/\0]/.test(label)) {
+    throw new Error('account label must not contain path separators or NUL characters')
+  }
+  const suffix = randomBytes(8).toString('hex')
+  return join(home, '.switchroom', 'accounts', '.in-progress', `${label}-${suffix}`)
+}
+/**
+ * Remove a scratch directory and everything beneath it, never throwing.
+ *
+ * Called from every exit path of the add flow (success, cancel,
+ * timeout, error). Deliberately synchronous: by the time this runs the
+ * user-facing reply is already settled, so shaving a tick off is not
+ * worth the extra async plumbing.
+ *
+ * @param scratchDir Directory to delete; a missing path is not an error.
+ */
+export function cleanScratchDir(scratchDir: string): void {
+  const wipeOptions = { recursive: true, force: true } as const
+  try {
+    rmSync(scratchDir, wipeOptions)
+  } catch {
+    // best-effort
+  }
+}
+/* ── Subprocess lifecycle ─────────────────────────────────────────────── */
+/** What {@link startAccountAuthSession} resolves with once the URL is known. */
+export interface StartAccountAuthSessionResult {
+  /** OAuth authorize URL parsed from the child's stdout/stderr. */
+  loginUrl: string
+  /** Scratch directory created for this session and passed as `CLAUDE_CONFIG_DIR`. */
+  scratchDir: string
+  /** The still-running `claude setup-token` process (stdin left open). */
+  child: ChildProcess
+}
+/**
+ * Spawn `claude setup-token` against a fresh scratch directory and
+ * resolve once the authorize URL has been parsed from its stdout/stderr.
+ *
+ * Why we *don't* use tmux: the `submitAuthCode` path in
+ * `src/auth/manager.ts` uses tmux because that flow is interactive —
+ * an operator on a host can `tmux attach` to inspect the auth prompt
+ * if anything goes wrong. The chat flow has no equivalent escape
+ * hatch (the operator is on their phone) and a pipe-based subprocess
+ * is far easier to lifecycle-manage from a long-running gateway. We
+ * write the code to the child's stdin in {@link submitAccountAuthCode}.
+ *
+ * The child is left running between {@link startAccountAuthSession}
+ * and {@link submitAccountAuthCode} — closing stdin before the code
+ * is pasted would tear down the OAuth session.
+ *
+ * Timeout default: 12 seconds to see the URL. claude setup-token
+ * typically prints the URL within ~3–5s; 12s covers an unloaded VM
+ * with slow startup. Caller passes the timeout via opts so tests can
+ * shorten it.
+ *
+ * @param label Account label; becomes part of the scratch dir name.
+ * @param opts `home` (scratch root), `urlTimeoutMs` (URL deadline) and
+ *   `claudeBinary` (binary override for tests).
+ * @returns The login URL, the scratch dir and the live child process.
+ * @throws Error when the binary cannot be started, exits before
+ *   printing a URL, or prints none within `urlTimeoutMs`. On every
+ *   failure the child is killed and the scratch dir removed first.
+ */
+export async function startAccountAuthSession(
+  label: string,
+  opts: {
+    home?: string
+    urlTimeoutMs?: number
+    /** Override the binary name (tests). */
+    claudeBinary?: string
+  } = {},
+): Promise<StartAccountAuthSessionResult> {
+  const home = opts.home ?? homedir()
+  const urlTimeoutMs = opts.urlTimeoutMs ?? 12_000
+  const binary = opts.claudeBinary ?? 'claude'
+  const scratchDir = pickScratchDir(label, home)
+  mkdirSync(scratchDir, { recursive: true, mode: 0o700 })
+  // BROWSER=/bin/true: same rationale as src/auth/manager.ts's
+  // startAuthSession — suppress claude setup-token's host-side browser
+  // auto-launch (would land on Claude's login page with no cookies on
+  // a headless box). The chat flow is paste-only.
+  let child: ChildProcess
+  try {
+    child = spawn(binary, ['setup-token'], {
+      env: {
+        ...process.env,
+        CLAUDE_CONFIG_DIR: scratchDir,
+        BROWSER: '/bin/true',
+      },
+      stdio: ['pipe', 'pipe', 'pipe'],
+    })
+  } catch (err) {
+    // spawn() can throw synchronously on invalid arguments; don't
+    // leave the freshly created scratch dir behind.
+    cleanScratchDir(scratchDir)
+    throw err
+  }
+  // Set while we are still waiting for the URL; lets the permanent
+  // 'error' listener below reject the pending promise.
+  let failUrlWait: ((err: Error) => void) | null = null
+  // A ChildProcess emits 'error' when it cannot be spawned (e.g. the
+  // binary is missing) or cannot be killed. With no listener attached
+  // Node rethrows that as an uncaught exception and takes the whole
+  // gateway down, so this listener stays for the child's lifetime.
+  child.on('error', (err: Error) => {
+    failUrlWait?.(err)
+  })
+  // Same story for the stdin pipe: writing the pasted code to a child
+  // that already died raises EPIPE as an 'error' event on the stream.
+  // submitAccountAuthCode notices the dead child on its own.
+  child.stdin?.on('error', () => {
+    /* best-effort */
+  })
+  // Aggregate stdout+stderr; the URL can land on either channel
+  // depending on claude CLI version. Once the URL phase is over we keep
+  // draining the pipes (so the child never blocks on a full pipe) but
+  // stop accumulating, so a chatty child cannot grow memory unbounded.
+  let buffer = ''
+  let urlPhaseOver = false
+  const collect = (chunk: Buffer): void => {
+    if (!urlPhaseOver) buffer += chunk.toString('utf8')
+  }
+  child.stdout?.on('data', collect)
+  child.stderr?.on('data', collect)
+  try {
+    // Race: URL detection vs timeout vs child exit vs spawn failure.
+    const loginUrl = await new Promise<string>((resolve, reject) => {
+      const deadline = setTimeout(() => {
+        cleanup()
+        reject(new Error(`claude setup-token did not print an OAuth URL within ${urlTimeoutMs}ms`))
+      }, urlTimeoutMs)
+      const tick = setInterval(() => {
+        const url = parseSetupTokenUrl(buffer)
+        if (url) {
+          cleanup()
+          resolve(url)
+        }
+      }, 200)
+      const onExit = (code: number | null): void => {
+        cleanup()
+        reject(new Error(`claude setup-token exited (code ${code}) before printing OAuth URL`))
+      }
+      failUrlWait = (err: Error): void => {
+        cleanup()
+        reject(new Error(`claude setup-token could not be started: ${err.message}`))
+      }
+      child.once('exit', onExit)
+      function cleanup(): void {
+        clearTimeout(deadline)
+        clearInterval(tick)
+        child.removeListener('exit', onExit)
+        failUrlWait = null
+        urlPhaseOver = true
+      }
+    })
+    return { loginUrl, scratchDir, child }
+  } catch (err) {
+    // Kill the child and wipe the scratch dir before re-raising so
+    // failed-to-start sessions don't leak.
+    try { child.kill('SIGTERM') } catch { /* best-effort */ }
+    cleanScratchDir(scratchDir)
+    throw err
+  }
+}
+/**
+ * Paste the operator's browser code into the live `claude setup-token`
+ * child's stdin and wait for the credentials file it writes on success.
+ *
+ * Returns the `AddAccountCredentials` shape the broker's add-account
+ * verb expects — same `claudeAiOauth: { accessToken, refreshToken,
+ * expiresAt, scopes, subscriptionType, rateLimitTier }` envelope.
+ *
+ * On success: the caller is responsible for invoking
+ * `cleanScratchDir(scratchDir)` after `addAccount` returns; we
+ * deliberately don't wipe here because the broker call might race the
+ * filesystem cleanup. On failure (invalid code, expired code, timeout)
+ * the helper throws and cleans the scratch dir itself.
+ *
+ * Poll interval default: 250ms — half of `submitAuthCode`'s 500ms,
+ * because there is no tmux capture-pane overhead per tick.
+ * Timeout default: 120s, matching the env var in `submitAuthCode`.
+ *
+ * @param flow The pending flow whose child process receives the code.
+ * @param code Browser code as pasted by the operator (trimmed here).
+ * @param opts `pollIntervalMs` / `pollTimeoutMs` overrides (tests).
+ * @returns The `claudeAiOauth` envelope read from `.credentials.json`.
+ * @throws Error when the child is already gone or its stdin is not
+ *   writable, when the child exits or is killed before credentials
+ *   appear, or when nothing appears within `pollTimeoutMs`.
+ */
+export async function submitAccountAuthCode(
+  flow: PendingAuthAddFlow,
+  code: string,
+  opts: { pollIntervalMs?: number; pollTimeoutMs?: number } = {},
+): Promise<AddAccountCredentials> {
+  const pollIntervalMs = opts.pollIntervalMs ?? 250
+  const pollTimeoutMs = opts.pollTimeoutMs ?? 120_000
+  const credentialsPath = join(flow.scratchDir, '.credentials.json')
+  const { child } = flow
+  // `exitCode` stays null when the process was terminated by a signal;
+  // `signalCode` is what gets set in that case. Checking only
+  // `exitCode` would leave us polling a dead child until the timeout.
+  const childGone = (): boolean => child.exitCode != null || child.signalCode != null
+  // Write the code + newline to stdin. claude setup-token's prompt
+  // expects line-buffered input — see the manual-paste step at the
+  // bottom of `submitAuthCode`. We use a single write here (vs the
+  // two send-keys calls of the tmux path) because there's no
+  // terminfo-flake concern over a pipe.
+  if (childGone() || !child.stdin || child.stdin.destroyed) {
+    cleanScratchDir(flow.scratchDir)
+    throw new Error('claude setup-token process stdin is not writable (child may have exited)')
+  }
+  child.stdin.write(code.trim() + '\n')
+  // Poll for the credentials file. Same two-channel design as
+  // submitAuthCode but tmux-pane-scrape and log-scrape are out (the
+  // pane scrape was a fallback for older claude CLI versions; the
+  // chat flow targets the current CLI by definition).
+  const deadline = Date.now() + pollTimeoutMs
+  while (Date.now() < deadline) {
+    await new Promise((r) => setTimeout(r, pollIntervalMs))
+    if (existsSync(credentialsPath)) {
+      const token = readTokenFromCredentialsFile(credentialsPath)
+      if (token) {
+        // Parse the full credentials envelope to forward to the
+        // broker. readTokenFromCredentialsFile already validated the
+        // accessToken regex, so the JSON is well-formed.
+        try {
+          const raw = readFileSync(credentialsPath, 'utf-8')
+          const parsed = JSON.parse(raw) as { claudeAiOauth?: AnthropicAddAccountCredentials['claudeAiOauth'] }
+          if (parsed.claudeAiOauth?.accessToken) {
+            // Drain the child so it exits cleanly after success.
+            try { child.stdin?.end() } catch { /* best-effort */ }
+            return { claudeAiOauth: parsed.claudeAiOauth }
+          }
+        } catch {
+          // fall through — file may be mid-write; next tick retries.
+        }
+      }
+    }
+    // Detect child early exit (invalid code → claude prints + exits).
+    // Checked after the credentials probe so a child that wrote the
+    // file and then exited still counts as a success.
+    if (childGone()) {
+      const how = child.exitCode != null ? `code ${child.exitCode}` : `signal ${child.signalCode}`
+      cleanScratchDir(flow.scratchDir)
+      throw new Error(
+        `claude setup-token exited (${how}) — code may have been invalid or expired`,
+      )
+    }
+  }
+  // Timeout — kill the child + wipe scratch.
+  try { child.kill('SIGTERM') } catch { /* best-effort */ }
+  cleanScratchDir(flow.scratchDir)
+  throw new Error(`No credentials file appeared at ${credentialsPath} within ${Math.round(pollTimeoutMs / 1000)}s`)
+}
+/**
+ * Abort a pending `/auth add` flow.
+ *
+ * Sends SIGTERM to the `claude setup-token` child unless it has
+ * already reported an exit code, then removes the scratch dir.
+ * Dropping the `pendingAuthAddFlows` entry is left to the caller.
+ * Safe to call repeatedly and after the child has exited.
+ *
+ * @param flow The pending flow to tear down.
+ */
+export function cancelAccountAuthSession(flow: PendingAuthAddFlow): void {
+  const { child, scratchDir } = flow
+  try {
+    const hasExitCode = child.exitCode != null
+    if (!hasExitCode) {
+      child.kill('SIGTERM')
+    }
+  } catch {
+    // best-effort
+  }
+  cleanScratchDir(scratchDir)
+}

package/telegram-plugin/gateway/auth-broker-client.ts ADDED Viewed

@@ -0,0 +1,75 @@
+/**
+ * Thin adapter between the gateway and `src/auth/broker/client.ts`.
+ *
+ * The broker client is a stateful class (holds a persistent UDS
+ * connection). The gateway constructs one per `/auth` command —
+ * cheap, and avoids dangling sockets on idle. The handler needs the
+ * five methods on the `AuthBrokerClient` interface in
+ * `./auth-command.ts` (listState / setActive / rmAccount /
+ * refreshAccount / setOverride); we narrow `BrokerClient` down to
+ * that surface so a test mock only has to stub those five.
+ */
+import { AuthBrokerClient as BrokerClient, type AddAccountCredentials } from '../../src/auth/broker/client.js'
+import type { AuthBrokerClient } from './auth-command.js'
+/**
+ * Build an {@link AuthBrokerClient} for a single `/auth` command.
+ *
+ * A fresh `BrokerClient` is constructed per call and only the five
+ * verbs the handler uses are forwarded to it.
+ *
+ * @returns `client` — the narrowed five-method surface — and `close`,
+ *   which closes the underlying broker connection. Closing is the
+ *   caller's job: `await close()` once the reply has landed.
+ */
+export function createAuthBrokerClient(): {
+  client: AuthBrokerClient
+  close: () => Promise<void>
+} {
+  const broker = new BrokerClient()
+  return {
+    client: {
+      listState: () => broker.listState(),
+      setActive: (label: string) => broker.setActive(label),
+      rmAccount: (label: string) => broker.rmAccount(label),
+      refreshAccount: (label: string) => broker.refreshAccount(label),
+      setOverride: (agent: string, account: string | null) =>
+        broker.setOverride(agent, account),
+    },
+    close: () => broker.close(),
+  }
+}
+/**
+ * Legacy entry point, retained so the gateway's existing call site
+ * keeps working unchanged. Hands back only the client half of
+ * {@link createAuthBrokerClient}; the matching `close` is discarded,
+ * so the underlying socket is never closed by this path. That is
+ * tolerated because:
+ *   - The gateway is long-lived (one process per agent).
+ *   - The broker tolerates many connections per peer.
+ *   - `/auth` is a low-frequency human-driven verb.
+ *
+ * Callers that care about the leak should use
+ * `createAuthBrokerClient` directly and call its `close`.
+ *
+ * @param _agentName Unused; kept for signature compatibility.
+ * @returns A freshly constructed client (this implementation never
+ *   resolves `null`).
+ */
+export async function getAuthBrokerClient(
+  _agentName: string,
+): Promise<AuthBrokerClient | null> {
+  const handle = createAuthBrokerClient()
+  return handle.client
+}
+/**
+ * Register an account with the broker on behalf of the `/auth add`
+ * chat flow.
+ *
+ * `addAccount` is intentionally absent from the narrow
+ * {@link AuthBrokerClient} surface in `auth-command.ts` because the
+ * verb is gateway-routed (not handler-routed). A one-shot
+ * {@link BrokerClient} is opened for the call and closed again
+ * whether the call succeeds or throws, so the gateway needs no
+ * long-lived handle for this verb.
+ *
+ * @param label Account label to register.
+ * @param credentials Credential envelope forwarded to the broker as-is.
+ * @param opts `replace` is passed through to the broker unchanged.
+ * @returns Whatever the broker's `addAccount` resolves with.
+ */
+export async function addAccountViaBroker(
+  label: string,
+  credentials: AddAccountCredentials,
+  opts: { replace?: boolean } = {},
+): Promise<{ label: string; expiresAt?: number }> {
+  const { replace } = opts
+  const oneShot = new BrokerClient()
+  try {
+    const added = await oneShot.addAccount(label, credentials, replace)
+    return added
+  } finally {
+    await oneShot.close()
+  }
+}