npm - switchroom - Versions diffs - 0.7.15 → 0.10.0 - Mend

switchroom 0.7.15 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (301) hide show

package/README.md +51 -59
package/bin/run-hook.sh +27 -11
package/bin/timezone-hook.sh +9 -7
package/dist/agent-scheduler/index.js +410 -133
package/dist/auth-broker/index.js +13932 -0
package/dist/cli/switchroom.js +26937 -5601
package/dist/host-control/main.js +12702 -0
package/dist/vault/approvals/kernel-server.js +467 -184
package/dist/vault/broker/server.js +1430 -724
package/examples/minimal.yaml +63 -0
package/examples/personal-google-workspace-mcp/.env.example +34 -0
package/examples/personal-google-workspace-mcp/README.md +194 -0
package/examples/personal-google-workspace-mcp/compose.yaml +66 -0
package/examples/switchroom.yaml +220 -0
package/package.json +7 -4
package/profiles/_base/settings.json.hbs +20 -5
package/profiles/_base/start.sh.hbs +16 -3
package/profiles/_shared/agent-self-service.md.hbs +126 -0
package/profiles/_shared/telegram-style.md.hbs +20 -90
package/profiles/_shared/vault-protocol.md.hbs +68 -0
package/profiles/default/CLAUDE.md +50 -96
package/profiles/default/CLAUDE.md.hbs +36 -6
package/profiles/default/workspace/SOUL.md.hbs +12 -5
package/skills/buildkite-agent-infrastructure/SKILL.md +30 -11
package/skills/buildkite-agent-runtime/SKILL.md +44 -11
package/skills/buildkite-api/SKILL.md +31 -8
package/skills/buildkite-cli/SKILL.md +27 -9
package/skills/buildkite-migration/SKILL.md +22 -9
package/skills/buildkite-pipelines/SKILL.md +26 -9
package/skills/buildkite-secure-delivery/SKILL.md +23 -9
package/skills/buildkite-test-engine/SKILL.md +25 -8
package/skills/docx/SKILL.md +1 -1
package/skills/docx/scripts/office/validators/__pycache__/__init__.cpython-313.pyc +0 -0
package/skills/docx/scripts/office/validators/__pycache__/base.cpython-313.pyc +0 -0
package/skills/file-bug/SKILL.md +34 -6
package/skills/humanizer/SKILL.md +15 -0
package/skills/humanizer-calibrate/SKILL.md +7 -1
package/skills/mcp-builder/SKILL.md +1 -1
package/skills/pdf/SKILL.md +1 -1
package/skills/pptx/SKILL.md +1 -1
package/skills/skill-creator/SKILL.md +21 -1
package/skills/skill-creator/scripts/__pycache__/__init__.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/generate_report.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/improve_description.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_eval.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_loop.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/utils.cpython-313.pyc +0 -0
package/skills/switchroom-cli/SKILL.md +63 -64
package/skills/switchroom-health/SKILL.md +23 -10
package/skills/switchroom-install/SKILL.md +3 -3
package/skills/switchroom-manage/SKILL.md +26 -19
package/skills/switchroom-runtime/SKILL.md +191 -0
package/skills/switchroom-status/SKILL.md +27 -2
package/skills/telegram-test-harness/SKILL.md +3 -0
package/skills/token-helpers/SKILL.md +24 -1
package/skills/webapp-testing/SKILL.md +31 -1
package/skills/xlsx/SKILL.md +1 -1
package/telegram-plugin/admin-commands/index.ts +7 -5
package/telegram-plugin/analytics-posthog.ts +191 -0
package/telegram-plugin/bridge/bridge.ts +69 -0
package/telegram-plugin/bridge/ipc-client.ts +4 -1
package/telegram-plugin/dist/bridge/bridge.js +194 -119
package/telegram-plugin/dist/gateway/gateway.js +23611 -19671
package/telegram-plugin/dist/server.js +245 -189
package/telegram-plugin/first-paint.ts +3 -24
package/telegram-plugin/gateway/auth-add-flow.ts +326 -0
package/telegram-plugin/gateway/auth-broker-client.ts +75 -0
package/telegram-plugin/gateway/auth-command.ts +794 -0
package/telegram-plugin/gateway/auth-line.ts +123 -0
package/telegram-plugin/gateway/boot-card.ts +169 -40
package/telegram-plugin/gateway/boot-issue-cache.ts +308 -0
package/telegram-plugin/gateway/boot-probes.ts +166 -123
package/telegram-plugin/gateway/boot-reason.ts +41 -7
package/telegram-plugin/gateway/boot-version.ts +66 -0
package/telegram-plugin/gateway/gateway.ts +3499 -1885
package/telegram-plugin/gateway/hostd-dispatch.ts +117 -0
package/telegram-plugin/gateway/ipc-protocol.ts +18 -0
package/telegram-plugin/gateway/pending-inbound-buffer.ts +106 -0
package/telegram-plugin/gateway/quarantine.ts +69 -0
package/telegram-plugin/gateway/quota-cache.ts +9 -4
package/telegram-plugin/gateway/reaction-trigger.ts +401 -0
package/telegram-plugin/gateway/recent-denials.test.ts +103 -0
package/telegram-plugin/gateway/recent-denials.ts +77 -0
package/telegram-plugin/gateway/startup-network-retry.ts +109 -31
package/telegram-plugin/gateway/vault-grant-inbound-builders.ts +125 -0
package/telegram-plugin/history.ts +91 -0
package/telegram-plugin/hooks/hooks.json +10 -0
package/telegram-plugin/hooks/sandbox-hint-posttool.mjs +130 -0
package/telegram-plugin/hooks/subagent-tracker-posttool.mjs +19 -2
package/telegram-plugin/hooks/subagent-tracker-pretool.mjs +22 -2
package/telegram-plugin/hooks/tool-label-pretool.mjs +11 -0
package/telegram-plugin/hooks/wedge-detect-posttool.mjs +303 -0
package/telegram-plugin/inbound-classifier.ts +50 -0
package/telegram-plugin/inline-keyboard-callbacks.ts +136 -0
package/telegram-plugin/node_modules/.vite/vitest/da39a3ee5e6b4b0d3255bfef95601890afd80709/results.json +1 -0
package/telegram-plugin/package.json +4 -2
package/telegram-plugin/permission-rule.ts +51 -0
package/telegram-plugin/permission-title.ts +56 -0
package/telegram-plugin/quota-check.ts +19 -41
package/telegram-plugin/registry/reaper.ts +223 -0
package/telegram-plugin/retry-api-call.ts +80 -0
package/telegram-plugin/runtime-metrics.ts +177 -0
package/telegram-plugin/scripts/build.mjs +0 -1
package/telegram-plugin/secret-detect/index.ts +24 -0
package/telegram-plugin/secret-detect/vault-error.test.ts +64 -12
package/telegram-plugin/secret-detect/vault-error.ts +78 -11
package/telegram-plugin/secret-detect/vault-write.ts +14 -2
package/telegram-plugin/server.js +41795 -0
package/telegram-plugin/session-tail.ts +6 -1
package/telegram-plugin/shared/bot-runtime.ts +5 -4
package/telegram-plugin/silence-poke.ts +420 -0
package/telegram-plugin/silent-end.ts +174 -0
package/telegram-plugin/stream-controller.ts +13 -0
package/telegram-plugin/stream-reply-handler.ts +7 -0
package/telegram-plugin/subagent-watcher.ts +213 -4
package/telegram-plugin/tests/auth-add-flow.test.ts +559 -0
package/telegram-plugin/tests/auth-code-redact.test.ts +8 -4
package/telegram-plugin/tests/auth-command-vernacular.test.ts +531 -0
package/telegram-plugin/tests/boot-card-issue-dedup.test.ts +247 -0
package/telegram-plugin/tests/boot-card-reason-to-render.test.ts +182 -0
package/telegram-plugin/tests/boot-card-reason.test.ts +65 -2
package/telegram-plugin/tests/boot-card-render.test.ts +146 -0
package/telegram-plugin/tests/boot-card-silent-on-operator.test.ts +103 -0
package/telegram-plugin/tests/boot-probes.test.ts +216 -10
package/telegram-plugin/tests/boot-version-string.test.ts +0 -0
package/telegram-plugin/tests/finalize-callback.test.ts +190 -0
package/telegram-plugin/tests/gateway-message-validator.test.ts +26 -0
package/telegram-plugin/tests/gateway-secret-detect.test.ts +12 -3
package/telegram-plugin/tests/gateway-startup-network-retry.test.ts +104 -0
package/telegram-plugin/tests/history-reaper.test.ts +378 -0
package/telegram-plugin/tests/hostd-dispatch.test.ts +129 -0
package/telegram-plugin/tests/inbound-classifier.test.ts +76 -0
package/telegram-plugin/tests/inbound-message-types.test.ts +267 -0
package/telegram-plugin/tests/issues-card.test.ts +49 -0
package/telegram-plugin/tests/pending-inbound-buffer.test.ts +132 -0
package/telegram-plugin/tests/permission-rule.test.ts +80 -1
package/telegram-plugin/tests/permission-title.test.ts +31 -0
package/telegram-plugin/tests/quota-check.test.ts +5 -35
package/telegram-plugin/tests/races.test.ts +179 -0
package/telegram-plugin/tests/reaction-trigger-flow.test.ts +353 -0
package/telegram-plugin/tests/reaction-trigger.test.ts +397 -0
package/telegram-plugin/tests/retry-api-call.test.ts +152 -1
package/telegram-plugin/tests/runtime-metrics.test.ts +145 -0
package/telegram-plugin/tests/sandbox-hint-posttool.test.ts +155 -0
package/telegram-plugin/tests/secret-detect-delete-must-surface-failures.test.ts +133 -0
package/telegram-plugin/tests/secret-detect-false-positives.test.ts +137 -0
package/telegram-plugin/tests/silence-poke.test.ts +493 -0
package/telegram-plugin/tests/silent-end.test.ts +206 -0
package/telegram-plugin/tests/subagent-tracker-hooks.test.ts +107 -0
package/telegram-plugin/tests/subagent-watcher-env-thresholds.test.ts +224 -0
package/telegram-plugin/tests/subagent-watcher-stall-terminal.test.ts +316 -0
package/telegram-plugin/tests/subagent-watcher.test.ts +263 -0
package/telegram-plugin/tests/turn-signal-tracker.test.ts +81 -0
package/telegram-plugin/tests/vault-approval-posture.test.ts +256 -0
package/telegram-plugin/tests/vault-grant-auto-resume.test.ts +73 -0
package/telegram-plugin/tests/vault-grant-inbound-builders.test.ts +226 -0
package/telegram-plugin/tests/vault-grant-union.test.ts +130 -0
package/telegram-plugin/tests/vault-key-regex-allows-slash.test.ts +140 -0
package/telegram-plugin/tests/vault-posture-quarantine.test.ts +104 -0
package/telegram-plugin/tests/vault-request-access-tool.test.ts +114 -0
package/telegram-plugin/tests/vault-request-access-unlock-resume.test.ts +106 -0
package/telegram-plugin/turn-signal-tracker.ts +100 -24
package/telegram-plugin/uat/SETUP.md +210 -35
package/telegram-plugin/uat/assertions.ts +264 -37
package/telegram-plugin/uat/driver-info.ts +57 -0
package/telegram-plugin/uat/driver.ts +590 -51
package/telegram-plugin/uat/harness.ts +140 -94
package/telegram-plugin/uat/load-env.test.ts +72 -0
package/telegram-plugin/uat/load-env.ts +48 -0
package/telegram-plugin/uat/login.ts +96 -53
package/telegram-plugin/uat/runners/agent-self-sufficiency.ts +457 -0
package/telegram-plugin/uat/runners/paraphrases.ts +231 -0
package/telegram-plugin/uat/runners/report.ts +150 -0
package/telegram-plugin/uat/runners/run-agent-self-sufficiency.sh +50 -0
package/telegram-plugin/uat/runners/scorer.test.ts +196 -0
package/telegram-plugin/uat/runners/scorer.ts +106 -0
package/telegram-plugin/uat/runners/skill-coverage.test.ts +100 -0
package/telegram-plugin/uat/runners/skill-coverage.ts +620 -0
package/telegram-plugin/uat/scenarios/ask-user-button-tap-dm.test.ts +141 -0
package/telegram-plugin/uat/scenarios/bg-sub-agent-dispatch-dm.test.ts +191 -0
package/telegram-plugin/uat/scenarios/fuzz-extended-dm.test.ts +255 -0
package/telegram-plugin/uat/scenarios/fuzz-human-style-dm.test.ts +275 -0
package/telegram-plugin/uat/scenarios/fuzz-random-prompts-dm.test.ts +146 -0
package/telegram-plugin/uat/scenarios/fuzz-status-ask-dm.test.ts +486 -0
package/telegram-plugin/uat/scenarios/jtbd-interrupt-marker-dm.test.ts +67 -0
package/telegram-plugin/uat/scenarios/jtbd-rapid-followup-dm.test.ts +100 -0
package/telegram-plugin/uat/scenarios/jtbd-soft-commit-dm.test.ts +67 -0
package/telegram-plugin/uat/scenarios/jtbd-status-query-dm.test.ts +49 -0
package/telegram-plugin/uat/scenarios/location-inbound-dm.test.ts +65 -0
package/telegram-plugin/uat/scenarios/midturn-silent-dm.test.ts +175 -0
package/telegram-plugin/uat/scenarios/reactions-dm.test.ts +142 -0
package/telegram-plugin/uat/scenarios/reactions-trigger-turn-dm.test.ts +96 -0
package/telegram-plugin/uat/scenarios/secret-redaction-deletes-original-dm.test.ts +123 -0
package/telegram-plugin/uat/scenarios/secret-redaction-no-false-positive-dm.test.ts +87 -0
package/telegram-plugin/uat/scenarios/silence-poke-soft-dm.test.ts +155 -0
package/telegram-plugin/uat/scenarios/silent-end-recovery-dm.test.ts +95 -0
package/telegram-plugin/uat/scenarios/smoke-dm-reply.test.ts +57 -0
package/telegram-plugin/uat/scenarios/subagent-watcher-no-rerun-dm.test.ts +135 -0
package/telegram-plugin/uat/scenarios/vault-approval-posture-telegram-id-dm.test.ts +191 -0
package/telegram-plugin/uat/scenarios/vault-audit-allow-dm.test.ts +108 -0
package/telegram-plugin/uat/scenarios/vault-grant-auto-resume-dm.test.ts +121 -0
package/telegram-plugin/uat/scenarios/vault-request-access-concurrent-dm.test.ts +161 -0
package/telegram-plugin/uat/scenarios/vault-request-access-end-to-end-dm.test.ts +158 -0
package/telegram-plugin/uat/scenarios/voice-inbound-dm.test.ts +65 -0
package/telegram-plugin/vault-approval-posture.ts +42 -0
package/telegram-plugin/welcome-text.ts +1 -0
package/telegram-plugin/active-pins-sweep.ts +0 -204
package/telegram-plugin/active-pins.ts +0 -146
package/telegram-plugin/auth-dashboard.ts +0 -1104
package/telegram-plugin/auth-slot-parser.ts +0 -497
package/telegram-plugin/card-event-log.ts +0 -138
package/telegram-plugin/dist/foreman/foreman.js +0 -31106
package/telegram-plugin/docs/multi-agent-card-design.md +0 -847
package/telegram-plugin/docs/pinned-progress-card-reliability.md +0 -144
package/telegram-plugin/foreman/foreman-create-flow.ts +0 -202
package/telegram-plugin/foreman/foreman-handlers.ts +0 -493
package/telegram-plugin/foreman/foreman.ts +0 -1165
package/telegram-plugin/foreman/setup-flow.ts +0 -345
package/telegram-plugin/foreman/setup-state.ts +0 -239
package/telegram-plugin/foreman/state.ts +0 -203
package/telegram-plugin/pin-event-log.ts +0 -76
package/telegram-plugin/progress-card-driver.ts +0 -2886
package/telegram-plugin/progress-card-pin-manager.ts +0 -589
package/telegram-plugin/progress-card-pin-watchdog.ts +0 -98
package/telegram-plugin/progress-card.ts +0 -1409
package/telegram-plugin/tests/HARNESS.md +0 -340
package/telegram-plugin/tests/_progress-card-harness.ts +0 -109
package/telegram-plugin/tests/active-pins-boot-reaper.test.ts +0 -211
package/telegram-plugin/tests/active-pins-sweep.test.ts +0 -309
package/telegram-plugin/tests/active-pins.test.ts +0 -187
package/telegram-plugin/tests/auth-account-identity-surface.test.ts +0 -118
package/telegram-plugin/tests/auth-dashboard-edge-cases.test.ts +0 -260
package/telegram-plugin/tests/auth-dashboard-restart-flow.test.ts +0 -140
package/telegram-plugin/tests/auth-dashboard-v3b.test.ts +0 -559
package/telegram-plugin/tests/auth-dashboard.test.ts +0 -1045
package/telegram-plugin/tests/auth-slot-commands.test.ts +0 -640
package/telegram-plugin/tests/bg-agent-progress-card-757.test.ts +0 -201
package/telegram-plugin/tests/boot-card-account-quota.test.ts +0 -137
package/telegram-plugin/tests/card-event-log.test.ts +0 -145
package/telegram-plugin/tests/first-paint.test.ts +0 -257
package/telegram-plugin/tests/foreman-create-flow.test.ts +0 -359
package/telegram-plugin/tests/foreman-handlers.test.ts +0 -347
package/telegram-plugin/tests/foreman-state.test.ts +0 -164
package/telegram-plugin/tests/foreman-write-ops.test.ts +0 -214
package/telegram-plugin/tests/harness-ordering-invariants.test.ts +0 -243
package/telegram-plugin/tests/pin-event-log.test.ts +0 -124
package/telegram-plugin/tests/progress-card-api-failure-during-deferred.test.ts +0 -73
package/telegram-plugin/tests/progress-card-close-paths-converge.test.ts +0 -272
package/telegram-plugin/tests/progress-card-cross-turn.test.ts +0 -258
package/telegram-plugin/tests/progress-card-delay-842.test.ts +0 -160
package/telegram-plugin/tests/progress-card-dispose-preservepending.test.ts +0 -81
package/telegram-plugin/tests/progress-card-draft-flag.test.ts +0 -80
package/telegram-plugin/tests/progress-card-driver-eviction.test.ts +0 -215
package/telegram-plugin/tests/progress-card-driver-fleet-shadow.test.ts +0 -123
package/telegram-plugin/tests/progress-card-driver-force-complete-parent-done.test.ts +0 -76
package/telegram-plugin/tests/progress-card-edit-timestamps-budget.test.ts +0 -62
package/telegram-plugin/tests/progress-card-memory-bounds.test.ts +0 -84
package/telegram-plugin/tests/progress-card-pin-failure-paths.test.ts +0 -139
package/telegram-plugin/tests/progress-card-pin-manager.test.ts +0 -773
package/telegram-plugin/tests/progress-card-pin-race-fast-turn.test.ts +0 -66
package/telegram-plugin/tests/progress-card-pin-sidecar-partial-write.test.ts +0 -64
package/telegram-plugin/tests/progress-card-pin-watchdog.test.ts +0 -190
package/telegram-plugin/tests/progress-card-sigterm-pin-flush.test.ts +0 -146
package/telegram-plugin/tests/real-gateway-f1-ladder-integrity.test.ts +0 -123
package/telegram-plugin/tests/real-gateway-f2-instant-draft.test.ts +0 -82
package/telegram-plugin/tests/real-gateway-f3-late-card.test.ts +0 -114
package/telegram-plugin/tests/real-gateway-harness.ts +0 -699
package/telegram-plugin/tests/real-gateway-i6-turn-flush-replay-dedup.test.ts +0 -313
package/telegram-plugin/tests/real-gateway-ipc-lifecycle.test.ts +0 -299
package/telegram-plugin/tests/real-gateway-spec.test.ts +0 -487
package/telegram-plugin/tests/real-gateway.smoke.test.ts +0 -101
package/telegram-plugin/tests/setup-flow.test.ts +0 -510
package/telegram-plugin/tests/setup-state.test.ts +0 -146
package/telegram-plugin/tests/sync-chat-running-subagents.test.ts +0 -116
package/telegram-plugin/tests/turn-end-regressions.test.ts +0 -489
package/telegram-plugin/tests/turn-flush-card-takeover.test.ts +0 -218
package/telegram-plugin/tests/turn-flush-prose-recovery.test.ts +0 -78
package/telegram-plugin/tests/two-zone-bg-carry-full-lifecycle.test.ts +0 -131
package/telegram-plugin/tests/two-zone-bg-detection.test.ts +0 -120
package/telegram-plugin/tests/two-zone-bg-done-when-all-terminal.test.ts +0 -116
package/telegram-plugin/tests/two-zone-bg-early-turn-end.test.ts +0 -87
package/telegram-plugin/tests/two-zone-bg-survives-next-turn.test.ts +0 -211
package/telegram-plugin/tests/two-zone-card-cap.test.ts +0 -62
package/telegram-plugin/tests/two-zone-card-fleet-row.test.ts +0 -101
package/telegram-plugin/tests/two-zone-card-header-phases.test.ts +0 -78
package/telegram-plugin/tests/two-zone-card-html-balance.test.ts +0 -110
package/telegram-plugin/tests/two-zone-card-lifecycle.test.ts +0 -128
package/telegram-plugin/tests/two-zone-card-sanitise.test.ts +0 -58
package/telegram-plugin/tests/two-zone-card-snapshot.test.ts +0 -133
package/telegram-plugin/tests/two-zone-concurrent-turns-isolation.test.ts +0 -155
package/telegram-plugin/tests/two-zone-phasefor-precedence.test.ts +0 -117
package/telegram-plugin/tests/two-zone-snapshot-extras.test.ts +0 -187
package/telegram-plugin/tests/two-zone-stuck-edit-throttle.test.ts +0 -149
package/telegram-plugin/tests/two-zone-stuck-header-escalation.test.ts +0 -101
package/telegram-plugin/tests/two-zone-stuck-per-member.test.ts +0 -114
package/telegram-plugin/tests/two-zone-stuck-recovery.test.ts +0 -105
package/telegram-plugin/tests/waiting-ux-harness.ts +0 -381
package/telegram-plugin/tests/waiting-ux.e2e.test.ts +0 -233
package/telegram-plugin/turn-flush-prose-recovery.ts +0 -40
package/telegram-plugin/two-zone-card.ts +0 -269
package/telegram-plugin/uat/scenarios/smoke-clerk-reply.test.ts +0 -61

package/telegram-plugin/gateway/startup-network-retry.ts CHANGED Viewed

@@ -1,5 +1,6 @@
 /**
- * Bounded exponential-backoff retry for gateway startup network errors.
+ * Bounded exponential-backoff retry for gateway startup network errors,
+ * with classification of the failure mode so the caller can act.
  *
  * On 2026-04-29 all five switchroom gateways silently broke at boot because
  * `api.telegram.org` was unreachable for ~27 minutes after system boot (the
@@ -9,22 +10,29 @@
  * process alive but not polling. No crash, so systemd's `Restart=always` never
  * fired. Telegram → agent delivery was dead until manual restarts.
  *
- * This module provides:
- *
- *   `isBootNetworkError(err)`  — recognises network-layer errors thrown by
- *       grammy's HttpError wrapper and by raw fetch/Node network failures.
+ * Then issue #1076: a *revoked or wrong-typed* bot token returns Telegram API
+ * 401 `Unauthorized`. Pre-fix `gatewayStartupRetry` rethrew non-network errors
+ * immediately, the surrounding gateway catch block exited 1, the in-container
+ * `_switchroom_supervise` respawned, the new gateway re-hit 401, repeat. Ten
+ * restarts in <60 s tripped the supervisor cap and the gateway went silently
+ * dead with no operator-visible signal. This module now distinguishes 401 as
+ * a permanent config error, which the gateway handles by writing an issue +
+ * quarantine marker + exit-78 (the supervisor's "config error, don't
+ * restart" sentinel — see profiles/_base/start.sh.hbs).
  *
- *   `STARTUP_RETRY_DELAYS_MS`  — the chosen backoff schedule.
+ * This module provides:
  *
- *   `gatewayStartupRetry(fn, opts)` — drives the retry loop. Calls `fn()` up to
- *       `maxAttempts` times with delays from `delaysMs`. On success it resolves.
- *       On exhaustion it calls `opts.onExhausted()` (default: `process.exit(1)`)
- *       so systemd's `Restart=always` can restart the unit cleanly.
+ *   `classifyStartupError(err)` — returns `'network' | 'unauthorized' | 'other'`.
+ *   `isBootNetworkError(err)` — back-compat alias for the network arm.
+ *   `STARTUP_RETRY_DELAYS_MS` — the chosen backoff schedule.
+ *   `gatewayStartupRetry(fn, opts)` — drives the retry loop.
  *
  * The function is extracted from `gateway.ts`'s top-level IIFE so it can be
  * unit-tested without spinning up the full bot runtime.
  */
+export type StartupErrorKind = 'network' | 'unauthorized' | 'other'
 export interface StartupRetryOpts {
   /**
    * Delay schedule in milliseconds. Each attempt waits the corresponding
@@ -39,11 +47,23 @@ export interface StartupRetryOpts {
   sleep?: (ms: number) => Promise<void>
   /**
-   * Called when all attempts are exhausted. Should NOT return (exit/throw).
-   * Defaults to `process.exit(1)`.
+   * Called when all NETWORK retries are exhausted. Should NOT return
+   * (exit/throw). Defaults to `process.exit(1)` so systemd /
+   * `_switchroom_supervise` restart-on-failure can recycle the unit.
    */
   onExhausted?: (lastError: unknown) => never
+  /**
+   * Called when a startup API call returns 401 Unauthorized. The bot token
+   * is permanently wrong (revoked, wrong type, typo) — retrying just burns
+   * the supervisor restart budget. Caller should write an issue + quarantine
+   * marker and `process.exit(78)` (EX_CONFIG). Should NOT return.
+   *
+   * Default: same exit-1 path as `onExhausted` so callers that haven't been
+   * updated keep the pre-fix behaviour (rather than silently swallowing 401).
+   */
+  onUnauthorized?: (err: unknown) => never
   /** Log sink for retry progress messages. Defaults to process.stderr.write. */
   log?: (line: string) => void
 }
@@ -67,38 +87,83 @@ const DEFAULT_SLEEP = (ms: number): Promise<void> =>
   new Promise((resolve) => setTimeout(resolve, ms))
 /**
- * Returns true if `err` is a transient network-level failure that the startup
- * retry loop should absorb. Covers:
+ * Classify a startup-time error into one of:
  *
- * - Grammy's `HttpError` (name === 'HttpError'), which wraps fetch/ECONN errors
- *   during `deleteWebhook` and `getMe`.
- * - Raw Node/fetch errors: ECONNRESET, ETIMEDOUT, ENOTFOUND, ECONNREFUSED,
- *   fetch failed, etc.
+ *   - `network`: transient connectivity / DNS / TCP / fetch failure — the
+ *     retry loop should absorb these with backoff.
+ *   - `unauthorized`: Telegram API 401 (revoked or wrong-typed bot token).
+ *     Permanent until the operator rotates the token. Retrying only burns
+ *     the supervisor restart budget for no gain — see #1076.
+ *   - `other`: everything else (bad request shape, 5xx, server bug, etc.).
+ *     Rethrown to the surrounding gateway catch block, which exits non-zero
+ *     so the supervisor can recycle.
+ *
+ * Grammy surfaces 401 via `GrammyError` (name === 'GrammyError') with
+ * `error_code === 401`. Some test fixtures and node-fetch wrappers surface
+ * 401 only in the message string, so we fall through to a substring match
+ * for `Unauthorized` as defence in depth.
  */
-export function isBootNetworkError(err: unknown): boolean {
-  if (!(err instanceof Error)) return false
-  // Grammy wraps network errors in HttpError (name is set in the constructor)
-  if (err.name === 'HttpError') return true
+export function classifyStartupError(err: unknown): StartupErrorKind {
+  if (!(err instanceof Error)) return 'other'
+  // Unauthorized (#1076). Check BEFORE the network arm so a Grammy-wrapped
+  // 401 doesn't accidentally match the "Network request" substring branch
+  // through some future change to grammy's error stringification.
+  const errAny = err as Error & {
+    error_code?: number
+    name?: string
+  }
+  if (
+    errAny.name === 'GrammyError' &&
+    errAny.error_code === 401
+  ) {
+    return 'unauthorized'
+  }
+  // Fall-back string match. Telegram's API returns the literal string
+  // 'Unauthorized' for 401 in the description field. We avoid matching
+  // on the bare substring '401' here because that can also match
+  // unrelated error codes / ports / numeric content.
+  if (err.message.includes('Unauthorized')) return 'unauthorized'
+  // Network arm — grammy wraps fetch/ECONN errors in HttpError.
+  if (err.name === 'HttpError') return 'network'
   const msg = err.message
-  return (
+  if (
     msg.includes('ECONNRESET') ||
     msg.includes('ETIMEDOUT') ||
     msg.includes('ENOTFOUND') ||
     msg.includes('ECONNREFUSED') ||
     msg.includes('fetch failed') ||
     msg.includes('Network request')
-  )
+  ) {
+    return 'network'
+  }
+  return 'other'
+}
+/**
+ * Returns true if `err` is a transient network-level failure that the startup
+ * retry loop should absorb. Retained as a named export for the existing
+ * regression tests and downstream callers that only care about the network
+ * arm. Prefer `classifyStartupError` for new code.
+ */
+export function isBootNetworkError(err: unknown): boolean {
+  return classifyStartupError(err) === 'network'
 }
 /**
- * Attempt `fn()` and retry on `isBootNetworkError` failures using the
- * provided delay schedule.
+ * Attempt `fn()` and retry on network failures using the provided delay
+ * schedule.
  *
  * - On success: returns whatever `fn()` resolved to.
- * - On non-network error: re-throws immediately (not a transient boot issue).
- * - On exhausted retries: calls `opts.onExhausted(lastError)` which must not
- *   return (it should exit or throw). The default is `process.exit(1)` so
- *   systemd's `Restart=always` picks up the dead unit.
+ * - On unauthorized (401): calls `opts.onUnauthorized(err)` which must not
+ *   return. The gateway uses this to write an issue + quarantine marker
+ *   + `process.exit(78)`. Default is `process.exit(1)` for back-compat.
+ * - On other non-network error: re-throws immediately (not a transient
+ *   boot issue, not a known config error).
+ * - On exhausted network retries: calls `opts.onExhausted(lastError)` which
+ *   must not return. Default is `process.exit(1)`.
  */
 export async function gatewayStartupRetry<T>(
   fn: () => Promise<T>,
@@ -114,6 +179,16 @@ export async function gatewayStartupRetry<T>(
       )
       process.exit(1)
     })
+  const onUnauthorized: (err: unknown) => never =
+    opts.onUnauthorized ??
+    ((err: unknown) => {
+      // Back-compat default. Real callers (gateway.ts) override this with
+      // an issue-sink writer + quarantine-marker writer + exit-78.
+      process.stderr.write(
+        `telegram gateway: startup unauthorized (bot token rejected) — exiting: ${(err as Error).message}\n`,
+      )
+      process.exit(1)
+    })
   const log =
     opts.log ??
     ((line: string) => {
@@ -127,7 +202,10 @@ export async function gatewayStartupRetry<T>(
     try {
       return await fn()
     } catch (err) {
-      if (!isBootNetworkError(err)) throw err
+      const kind = classifyStartupError(err)
+      if (kind === 'unauthorized') return onUnauthorized(err)
+      if (kind === 'other') throw err
+      // network
       lastError = err
       if (attempt >= maxAttempts) break
       const delayMs = delays[attempt - 1]

package/telegram-plugin/gateway/vault-grant-inbound-builders.ts ADDED Viewed

@@ -0,0 +1,125 @@
+/**
+ * Pure builders for the synthetic `vault_grant_approved` and
+ * `vault_grant_denied` inbounds the gateway injects after the
+ * operator taps Approve / Deny on a `vault_request_access` card
+ * (#1052 / #1150).
+ *
+ * Extracted from `gateway.ts` so the InboundMessage shape is pinned
+ * by tests separate from the broker/IPC plumbing. The shape is
+ * load-bearing — it carries the `meta.source` field the bridge keys
+ * on when rendering `<channel source="vault_grant_approved">` /
+ * `<channel source="vault_grant_denied">` blocks for the model, and
+ * the `meta.{agent,key,scope,stage_id,operator_id}` fields that
+ * downstream filters / dashboards may anchor on.
+ *
+ * A regression that drops a meta field or changes the source string
+ * would silently break the agent's wake-up flow — the bridge wouldn't
+ * recognize the source and would route it as a generic channel event, the
+ * model wouldn't know it was an approval response, and the
+ * conversation would drift. Pinning the builders against fixture
+ * tests is cheaper than catching that downstream.
+ */
+import type { InboundMessage } from './ipc-protocol.js'
+/** Subset of the pending-request state the builders need. Kept narrow
+ *  so callers don't have to pass the full PendingVaultRequestAccess. */
+export interface VaultGrantInboundContext {
+  agent: string
+  key: string
+  scope: 'read' | 'write'
+  /** Telegram chat id where the approval card lived. Used as the
+   *  inbound's chatId — keeps the synthesized turn associated with
+   *  the conversation that triggered the request. */
+  chat_id: string
+  /** Grant TTL in seconds. Used only for approved grants; ignored on deny. */
+  ttl_seconds: number
+}
+/**
+ * Build the synthetic InboundMessage for a successful operator
+ * approval. Meta fields are pinned by tests.
+ *
+ * @param opts.ctx         Per-request context (agent, key, scope, chat, TTL).
+ * @param opts.grantId     Broker-returned grant id (e.g. "vg_a1b2c3").
+ * @param opts.stageId     The card's stage id from the approval flow.
+ * @param opts.operatorId  Telegram user id of the approving operator
+ *                         (string for portability — Telegram ids are
+ *                         numeric but routinely round-trip as strings).
+ * @param opts.nowMs       Wall-clock ms. Used for both `ts` and
+ *                         `messageId` so the helper is deterministic
+ *                         under a fake clock. Defaults to `Date.now()`.
+ */
+export function buildVaultGrantApprovedInbound(opts: {
+  ctx: VaultGrantInboundContext
+  grantId: string
+  stageId: string
+  operatorId: string
+  nowMs?: number
+}): InboundMessage {
+  const ts = opts.nowMs ?? Date.now()
+  const days = Math.round(opts.ctx.ttl_seconds / 86400)
+  return {
+    type: 'inbound',
+    chatId: opts.ctx.chat_id,
+    messageId: ts, // synthetic — no Telegram message id exists
+    user: 'vault-broker',
+    userId: 0,
+    ts,
+    text:
+      `✅ Operator approved your vault access request for ` +
+      `\`${opts.ctx.key}\` (scope=${opts.ctx.scope}, ` +
+      `${days}d, grant=${opts.grantId}). ` +
+      `The token has been written. Please resume the task that was ` +
+      `waiting on this credential — fetch via the usual switchroom vault ` +
+      `get path.`,
+    meta: {
+      source: 'vault_grant_approved',
+      agent: opts.ctx.agent,
+      key: opts.ctx.key,
+      scope: opts.ctx.scope,
+      grant_id: opts.grantId,
+      stage_id: opts.stageId,
+      operator_id: opts.operatorId,
+    },
+  }
+}
+/**
+ * Build the synthetic InboundMessage for an operator denial.
+ *
+ * The text steers the model toward a fallback path (apologise, try a
+ * different approach, skip the feature) — added in #1156 alongside
+ * the buffer-on-disconnect fix because the deny side had the same
+ * agent-stays-idle bug as the approve side.
+ */
+export function buildVaultGrantDeniedInbound(opts: {
+  ctx: VaultGrantInboundContext
+  stageId: string
+  operatorId: string
+  nowMs?: number
+}): InboundMessage {
+  const ts = opts.nowMs ?? Date.now()
+  return {
+    type: 'inbound',
+    chatId: opts.ctx.chat_id,
+    messageId: ts,
+    user: 'vault-broker',
+    userId: 0,
+    ts,
+    text:
+      `🚫 Operator denied your vault access request for ` +
+      `\`${opts.ctx.key}\` (scope=${opts.ctx.scope}). ` +
+      `The credential is unavailable — pick a fallback for the original task ` +
+      `(apologise to the user, try a different approach, or skip the feature). ` +
+      `Do NOT re-request this key without first asking the user.`,
+    meta: {
+      source: 'vault_grant_denied',
+      agent: opts.ctx.agent,
+      key: opts.ctx.key,
+      scope: opts.ctx.scope,
+      stage_id: opts.stageId,
+      operator_id: opts.operatorId,
+    },
+  }
+}

package/telegram-plugin/history.ts CHANGED Viewed

@@ -195,6 +195,69 @@ export function _resetForTests(): void {
   }
 }
+/**
+ * Issue a WAL checkpoint on the history DB, releasing `*.db-wal` pages
+ * back to the main DB and truncating the WAL file. Called by the
+ * gateway's periodic reaper so the WAL doesn't grow unbounded in
+ * long-running agent sessions (issue #1073).
+ *
+ * `PRAGMA wal_checkpoint(TRUNCATE)` does not fail when readers block it:
+ * it returns a single row `(busy, log, checkpointed)` whose `busy` column
+ * is 1 when the checkpoint could not run to completion. The row is
+ * therefore read and inspected — discarding it would report success for
+ * a checkpoint that truncated nothing. A blocked checkpoint is non-fatal;
+ * the next reaper tick retries.
+ *
+ * The try/catch stays for genuine errors (I/O failure, closed handle),
+ * which are swallowed for the same best-effort reason.
+ *
+ * @returns true when the checkpoint completed; false when it was blocked
+ *          (`busy` non-zero), when an error was swallowed, or when
+ *          `initHistory` was never called.
+ */
+export function checkpointWal(): boolean {
+  if (db == null) return false
+  try {
+    const row = db.prepare('PRAGMA wal_checkpoint(TRUNCATE)').get() as
+      | { busy?: number | bigint | null }
+      | null
+      | undefined
+    // No row / no `busy` column is treated as "not blocked" so drivers that
+    // return nothing for PRAGMAs keep the previous success behaviour.
+    // Number() also covers drivers configured to return integers as bigint.
+    return Number(row?.busy ?? 0) === 0
+  } catch {
+    return false
+  }
+}
+/**
+ * Prune `messages` rows older than `retentionDays`. Used by the periodic
+ * reaper (#1073) to catch the case where the gateway runs for weeks or
+ * months — the init-time prune only fires once at boot.
+ *
+ * Returns the number of rows deleted (sum across all batches). No-op
+ * if `retentionDays <= 0` or if `initHistory` was never called.
+ *
+ * Batched to keep transactions short; otherwise a years-old DB on first
+ * boot after an upgrade would lock the inbound write path for the duration
+ * of a single multi-million-row DELETE. Uses the rowid-subselect form
+ * because bun:sqlite is built without SQLITE_ENABLE_UPDATE_DELETE_LIMIT
+ * (same constraint as reaper.ts).
+ *
+ * @param retentionDays Age threshold in days; values <= 0 disable pruning.
+ * @param nowSec        Optional "now" in epoch seconds; defaults to the
+ *                      wall clock floored to whole seconds.
+ * @param batchLimit    Maximum rows deleted per statement (default 5000).
+ *                      Bound directly to the SQL `LIMIT` with no validation
+ *                      — NOTE(review): confirm callers never pass a
+ *                      non-positive value.
+ * @returns Total rows deleted across all batches; 0 when nothing was done.
+ */
+export function pruneMessagesOlderThanDays(
+  retentionDays: number,
+  nowSec?: number,
+  batchLimit = 5000,
+): number {
+  if (db == null) return 0
+  if (retentionDays <= 0) return 0
+  const cutoffSec = (nowSec ?? Math.floor(Date.now() / 1000)) - retentionDays * 86400 // 86400 s per day; assumes messages.ts is epoch seconds — TODO confirm
+  const stmt = db.prepare(`
+    DELETE FROM messages
+    WHERE rowid IN (
+      SELECT rowid FROM messages WHERE ts < ? LIMIT ?
+    )
+  `)
+  let total = 0
+  // Same defence-in-depth ceiling as reaper.ts — caps a single call at
+  // 5M rows at the default batch size, more than any healthy fleet.
+  for (let i = 0; i < 1000; i++) {
+    const result = stmt.run(cutoffSec, batchLimit) as { changes: number } // prepared once, re-run per batch
+    const n = result.changes ?? 0
+    total += n
+    if (n === 0) break // a batch that deleted nothing means no rows remain below the cutoff
+  }
+  return total
+}
 function requireDb(): SqliteDatabase {
   if (db == null) {
     throw new Error('history: initHistory() must be called before any record/query operation')
@@ -430,6 +493,34 @@ export function getLatestInboundMessageId(
   return row?.message_id ?? null
 }
+/**
+ * Look up the role + text of a single message by (chat_id, message_id).
+ * Returns `null` if no row exists (the message predates history, the
+ * row was reaped, or history is disabled). Used by the reaction-trigger
+ * handler (#1074) to decide whether a reacted-to message is bot-authored
+ * AND to pull the preview text for the synthesized inbound — both in
+ * one DB hit, so the trigger predicate doesn't need a Telegram API call
+ * per reaction.
+ *
+ * Telegram message_ids are unique within a chat regardless of thread,
+ * so we match on (chat_id, message_id) and ignore thread_id — same as
+ * recordEdit / recordReaction.
+ *
+ * @param chatId    Chat the message belongs to.
+ * @param messageId Telegram message id within that chat.
+ * @returns `{ role, text }` for the matching row, with a NULL `text`
+ *          column normalised to `''`; `null` when no row matches.
+ * @throws Error from `requireDb()` when `initHistory()` has not been
+ *         called — this lookup does not degrade to a silent no-op.
+ */
+export function lookupMessageRoleAndText(
+  chatId: string,
+  messageId: number,
+): { role: 'user' | 'assistant'; text: string } | null {
+  const row = requireDb()
+    .prepare(
+      `SELECT role, text FROM messages WHERE chat_id = ? AND message_id = ? LIMIT 1`,
+    )
+    .get(chatId, messageId) as
+    | { role: 'user' | 'assistant'; text: string | null }
+    | undefined
+  if (!row) return null // no such (chat_id, message_id) row
+  return { role: row.role, text: row.text ?? '' } // callers always receive a string, never null
+}
 export function getRecentOutboundCount(
   chatId: string,
   withinSeconds: number,

package/telegram-plugin/hooks/hooks.json CHANGED Viewed

@@ -40,6 +40,16 @@
             "timeout": 10
           }
         ]
+      },
+      {
+        "matcher": ".*",
+        "hooks": [
+          {
+            "type": "command",
+            "command": "node \"${CLAUDE_PLUGIN_ROOT}/hooks/sandbox-hint-posttool.mjs\"",
+            "timeout": 3
+          }
+        ]
       }
     ],
     "Stop": [

package/telegram-plugin/hooks/sandbox-hint-posttool.mjs ADDED Viewed

@@ -0,0 +1,130 @@
+#!/usr/bin/env node
+/**
+ * PostToolUse hook — detects sandbox-related errors in tool_response and
+ * injects a one-line hint via Claude Code's `hookSpecificOutput.
+ * additionalContext` channel. The hint reminds the agent that the
+ * read-only file system / EROFS error is the switchroom sandbox working
+ * as intended, and that it should respond to the user with a concrete
+ * "Operator action: ..." line rather than retrying or echoing the raw
+ * kernel error.
+ *
+ * Pairs with the SANDBOX_GUIDANCE primer in --append-system-prompt
+ * (src/agents/scaffold.ts). The primer is the always-on context; this
+ * hook is the just-in-time nudge that fires only when the agent
+ * actually hits the boundary.
+ *
+ * Claude Code PostToolUse protocol:
+ *   stdin:  JSON { tool_name, tool_use_id, tool_input, tool_response, ... }
+ *   stdout: optional JSON
+ *             {"hookSpecificOutput":{"hookEventName":"PostToolUse",
+ *              "additionalContext":"<text>"}}
+ *           prepended to the model's next-turn context after the tool
+ *           result is shown.
+ *   exit:   0 always. Hook failures must never block the tool flow.
+ *
+ * Design notes:
+ *   - Detection is a substring/regex match against the stringified
+ *     tool_response (covers stdout, stderr, error fields).
+ *   - No DB writes, no IPC. Pure stdin → stdout, fail-silent.
+ *   - Idempotent: re-reading the same tool_response yields the same
+ *     hint. Claude Code dedupes additionalContext naturally because the
+ *     hook fires once per PostToolUse event.
+ */
+import { readFileSync } from 'node:fs'
+function readStdin() { // Synchronously read all of stdin (fd 0) as UTF-8 text.
+  try {
+    return readFileSync(0, 'utf8')
+  } catch {
+    return '' // any read failure is reported as empty input, never thrown
+  }
+}
+/**
+ * Patterns that indicate a sandbox-boundary hit, in order of specificity.
+ * Each entry: [regex, hint-key]. Hint text is composed below from the
+ * matched key — keeps the patterns easy to scan.
+ *
+ * None of the regexes carries the `g` or `y` flag, so `.test()` keeps no
+ * state between calls and the literals are safe to reuse.
+ */
+const PATTERNS = [
+  // The canonical kernel error code + message. Covers most write/mkdir/
+  // rename/unlink failures against the read-only rootfs.
+  [/\bEROFS\b/, 'erofs'],
+  [/read[- ]only file ?system/i, 'erofs'],
+  // npm/pip install attempts that hit a read-only prefix. Only EACCES is
+  // matched (not ENOENT), followed later in the text by a /usr/, /opt/,
+  // /etc/, /bin/ or /lib/ path segment. NOTE(review): the segment is not
+  // anchored to the path root, so e.g. /home/x/lib/ matches as well.
+  [/EACCES.+\/(usr|opt|etc|bin|lib)\//, 'eacces-rootfs'],
+  // apt / dpkg refusing to write to /var/lib/dpkg etc.
+  [/dpkg.*permission denied|apt.*permission denied|Unable to acquire the dpkg/i, 'apt'],
+]
+function buildHint(key) { // Compose the hint text for a matched pattern key.
+  const common = // base guidance returned for every key; only 'apt' appends to it
+    'Sandbox boundary hit. The agent container has `read_only: true` rootfs ' +
+    '(see the SANDBOX primer in the system prompt). Do NOT retry the same ' +
+    'write. Tell the user what you tried, why the sandbox blocked it, and ' +
+    'name an operator action (e.g. "edit on host then `switchroom apply`", ' +
+    'or "add to docker/Dockerfile.agent and rebuild"). Writable paths: ' +
+    '$HOME (/state/agent/home), /tmp, /state/agent/**, /var/log/switchroom.'
+  if (key === 'apt') { // package-manager failures get an extra, install-specific sentence
+    return (
+      common +
+      ' For package installs specifically: ask the operator to add the ' +
+      'package to docker/Dockerfile.agent and rebuild the agent image — ' +
+      'in-container apt is not the right path.'
+    )
+  }
+  return common // any other key (including unknown ones) gets the base text unchanged
+}
+function emitContext(text) { // Write one PostToolUse hook-output JSON object to stdout.
+  const payload = {
+    hookSpecificOutput: {
+      hookEventName: 'PostToolUse',
+      additionalContext: text, // the hint, passed through unchanged
+    },
+  }
+  process.stdout.write(JSON.stringify(payload) + '\n') // single newline-terminated line
+}
+function main() { // Read the hook event from stdin and emit at most one sandbox hint.
+  const raw = readStdin()
+  if (!raw) return // empty stdin: nothing to inspect
+  let evt
+  try {
+    evt = JSON.parse(raw)
+  } catch {
+    return // malformed event JSON: stay silent
+  }
+  // tool_response shape varies by tool — string for Bash, object with
+  // file/oldString/newString for Edit/Write, etc. Stringify the whole
+  // thing so we match against every nested error field at once. The
+  // 64 KiB cap below is applied after stringifying, so it bounds the
+  // regex scan (first 64K UTF-16 code units), not the stringify itself.
+  let body
+  try {
+    body = JSON.stringify(evt.tool_response ?? '') // a missing tool_response is scanned as an empty string
+  } catch {
+    return // JSON.stringify threw: stay silent
+  }
+  if (!body) return // JSON.stringify produced no string
+  if (body.length > 64 * 1024) body = body.slice(0, 64 * 1024)
+  for (const [pattern, key] of PATTERNS) {
+    if (pattern.test(body)) {
+      emitContext(buildHint(key))
+      return // first matching pattern wins; one hint per event
+    }
+  }
+}
+try {
+  main() // script entry point; produces output only when a pattern matched
+} catch {
+  // Fail-silent by design: a PostToolUse hook must never block the tool flow.
+}

package/telegram-plugin/hooks/subagent-tracker-posttool.mjs CHANGED Viewed

@@ -11,7 +11,13 @@
  * block the tool response.
  *
  * DB location: <agentDir>/telegram/registry.db
- *   agentDir = SWITCHROOM_AGENT_DIR env var, falling back to process.cwd()
+ *   agentDir lookup (first hit wins):
+ *     1. SWITCHROOM_AGENT_DIR env var (explicit override, mainly used in tests)
+ *     2. TELEGRAM_STATE_DIR with `/telegram` suffix stripped — the canonical
+ *        env var start.sh exports on every switchroom agent. See the
+ *        sibling pretool hook docblock for why this lookup matters (without
+ *        it the hook used to write to a registry.db nobody read).
+ *     3. process.cwd() (legacy fallback for ad-hoc invocations).
  *
  * Performance: the actual DB write is deferred via setImmediate (Node 22+
  * node:sqlite path) or non-blocking spawn (CLI fallback) so the hook returns
@@ -268,7 +274,18 @@ function main() {
   const id = event.tool_use_id ?? null
   if (!id) process.exit(0)
-  const agentDir = process.env.SWITCHROOM_AGENT_DIR ?? process.cwd()
+  // Same agent-dir resolution as the pretool hook (Bug 2 fix). Without
+  // the TELEGRAM_STATE_DIR derivation the posttool would write the
+  // `ended_at` row to a registry.db nobody reads, even though the row
+  // was originally inserted by the pretool hook that DID write to the
+  // correct DB (after this PR). Keep the two hooks in lock-step.
+  const stateDir = process.env.TELEGRAM_STATE_DIR
+  const derivedFromStateDir = stateDir && stateDir.endsWith('/telegram')
+    ? stateDir.slice(0, -'/telegram'.length)
+    : null
+  const agentDir = process.env.SWITCHROOM_AGENT_DIR
+    ?? derivedFromStateDir
+    ?? process.cwd()
   const dbPath = join(agentDir, 'telegram', 'registry.db')
   // If DB doesn't exist yet, nothing to update

package/telegram-plugin/hooks/subagent-tracker-pretool.mjs CHANGED Viewed

@@ -11,7 +11,17 @@
  * block the tool call.
  *
  * DB location: <agentDir>/telegram/registry.db
- *   agentDir = SWITCHROOM_AGENT_DIR env var, falling back to process.cwd()
+ *   agentDir lookup (first hit wins):
+ *     1. SWITCHROOM_AGENT_DIR env var (explicit override, mainly used in tests)
+ *     2. TELEGRAM_STATE_DIR with `/telegram` suffix stripped — the canonical
+ *        env var start.sh exports for every switchroom agent (and the same
+ *        path the gateway + watcher resolve their DB through). Without this
+ *        the hook used to fall through to process.cwd() in production,
+ *        writing to a registry.db nobody read, leaving every bg sub-agent
+ *        invisible to the watcher. Surfaced by
+ *        bg-sub-agent-dispatch-dm.test.ts; see RFC Phase 2 §Bug 2 in
+ *        reference/sub-agent-visibility-rfc.md.
+ *     3. process.cwd() (legacy fallback for ad-hoc invocations).
  *
  * Performance: the actual DB write is deferred via setImmediate (Node 22+
  * node:sqlite path) or a non-blocking spawn (CLI fallback) so the hook
@@ -223,7 +233,17 @@ function main() {
   // misroute).
   if (event.tool_name !== 'Agent' && event.tool_name !== 'Task') process.exit(0)
-  const agentDir = process.env.SWITCHROOM_AGENT_DIR ?? process.cwd()
+  // Resolve agent dir: explicit env override → derive from TELEGRAM_STATE_DIR
+  // (start.sh exports this on every agent) → cwd fallback. The middle case
+  // is the production path; without it the hook silently wrote to a
+  // registry.db nobody read (#709 / #776 / #782 / #788 Bug 2).
+  const stateDir = process.env.TELEGRAM_STATE_DIR
+  const derivedFromStateDir = stateDir && stateDir.endsWith('/telegram')
+    ? stateDir.slice(0, -'/telegram'.length)
+    : null
+  const agentDir = process.env.SWITCHROOM_AGENT_DIR
+    ?? derivedFromStateDir
+    ?? process.cwd()
   const telegramDir = join(agentDir, 'telegram')
   const dbPath = join(telegramDir, 'registry.db')

package/telegram-plugin/hooks/tool-label-pretool.mjs CHANGED Viewed

@@ -111,6 +111,17 @@ export function computeLabel(toolName, input) {
     case 'KillBash':
     case 'KillShell':
       return 'Stopping background process'
+    case 'Skill': {
+      // The Skill tool's input is `{ skill: "<slug>", args?: "..." }`.
+      // We emit `Running skill <slug>` so downstream observers
+      // (notably the skill-coverage UAT runner at
+      // telegram-plugin/uat/runners/skill-coverage.ts) can tail the
+      // sidecar JSONL and recover which skill fired per turn —
+      // the progress card path that used to surface this was retired
+      // when `progressDriver` was nulled out in #1122 PR3.
+      const slug = clip(String(i.skill ?? ''), 64)
+      return slug ? `Running skill ${slug}` : null
+    }
   }
   // MCP allowlist.