npm - switchroom - Versions diffs - 0.5.0 → 0.7.9 - Mend

switchroom 0.5.0 → 0.7.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

package/README.md +142 -121
package/bin/autoaccept.exp +29 -6
package/dist/agent-scheduler/index.js +12261 -0
package/dist/cli/autoaccept-poll.js +10 -0
package/dist/cli/switchroom.js +27250 -25324
package/dist/vault/approvals/kernel-server.js +12709 -0
package/dist/vault/broker/server.js +15724 -0
package/package.json +4 -3
package/profiles/_base/start.sh.hbs +133 -0
package/profiles/_shared/telegram-style.md.hbs +3 -3
package/profiles/default/CLAUDE.md +3 -3
package/profiles/default/CLAUDE.md.hbs +2 -2
package/profiles/default/workspace/CLAUDE.md.hbs +9 -0
package/skills/docx/VENDORED.md +1 -1
package/skills/mcp-builder/VENDORED.md +1 -1
package/skills/pdf/VENDORED.md +1 -1
package/skills/pptx/VENDORED.md +1 -1
package/skills/skill-creator/VENDORED.md +1 -1
package/skills/switchroom-architecture/SKILL.md +8 -7
package/skills/switchroom-cli/SKILL.md +23 -15
package/skills/switchroom-health/SKILL.md +7 -7
package/skills/switchroom-install/SKILL.md +36 -39
package/skills/switchroom-manage/SKILL.md +4 -4
package/skills/switchroom-status/SKILL.md +1 -1
package/skills/webapp-testing/VENDORED.md +1 -1
package/skills/xlsx/VENDORED.md +1 -1
package/telegram-plugin/admin-commands/dispatch.test.ts +119 -1
package/telegram-plugin/admin-commands/index.ts +71 -0
package/telegram-plugin/ask-user.ts +1 -0
package/telegram-plugin/card-event-log.ts +138 -0
package/telegram-plugin/dist/bridge/bridge.js +178 -31
package/telegram-plugin/dist/foreman/foreman.js +6875 -6526
package/telegram-plugin/dist/gateway/gateway.js +13862 -11834
package/telegram-plugin/dist/server.js +202 -40
package/telegram-plugin/fleet-state.ts +25 -10
package/telegram-plugin/foreman/foreman.ts +38 -3
package/telegram-plugin/gateway/approval-callback.ts +126 -0
package/telegram-plugin/gateway/approval-card.test.ts +90 -0
package/telegram-plugin/gateway/approval-card.ts +127 -0
package/telegram-plugin/gateway/approvals-commands.ts +126 -0
package/telegram-plugin/gateway/boot-card.ts +31 -6
package/telegram-plugin/gateway/boot-probes.ts +510 -72
package/telegram-plugin/gateway/gateway.ts +822 -94
package/telegram-plugin/gateway/ipc-protocol.ts +34 -1
package/telegram-plugin/gateway/ipc-server.ts +35 -0
package/telegram-plugin/gateway/startup-mutex.ts +110 -2
package/telegram-plugin/hooks/hooks.json +19 -0
package/telegram-plugin/hooks/tool-label-pretool.mjs +216 -0
package/telegram-plugin/hooks/tool-label-stop.mjs +63 -0
package/telegram-plugin/package.json +4 -1
package/telegram-plugin/plugin-logger.ts +20 -1
package/telegram-plugin/progress-card-driver.ts +202 -13
package/telegram-plugin/progress-card.ts +2 -2
package/telegram-plugin/quota-check.ts +1 -0
package/telegram-plugin/registry/subagents-schema.ts +37 -0
package/telegram-plugin/registry/subagents.test.ts +64 -0
package/telegram-plugin/session-tail.ts +58 -5
package/telegram-plugin/shared/bot-runtime.ts +48 -2
package/telegram-plugin/subagent-watcher.ts +139 -7
package/telegram-plugin/tests/_progress-card-harness.ts +4 -0
package/telegram-plugin/tests/bg-agent-progress-card-757.test.ts +201 -0
package/telegram-plugin/tests/boot-card-probe-target.test.ts +10 -34
package/telegram-plugin/tests/boot-card-render.test.ts +6 -5
package/telegram-plugin/tests/boot-probes.test.ts +564 -0
package/telegram-plugin/tests/card-event-log.test.ts +145 -0
package/telegram-plugin/tests/gateway-startup-mutex.test.ts +102 -0
package/telegram-plugin/tests/ipc-server-validate-inject-inbound.test.ts +134 -0
package/telegram-plugin/tests/progress-card-delay-842.test.ts +160 -0
package/telegram-plugin/tests/quota-check.test.ts +37 -1
package/telegram-plugin/tests/subagent-registry-bugs.test.ts +5 -0
package/telegram-plugin/tests/subagent-watcher-stall-notification.test.ts +104 -1
package/telegram-plugin/tests/subagent-watcher.test.ts +5 -0
package/telegram-plugin/tests/tool-label-sidecar.test.ts +114 -0
package/telegram-plugin/tests/two-zone-bg-done-when-all-terminal.test.ts +5 -3
package/telegram-plugin/tests/two-zone-card-header-phases.test.ts +10 -0
package/telegram-plugin/tests/two-zone-snapshot-extras.test.ts +58 -14
package/telegram-plugin/tests/welcome-text.test.ts +57 -0
package/telegram-plugin/tool-label-sidecar.ts +140 -0
package/telegram-plugin/tool-labels.ts +55 -0
package/telegram-plugin/two-zone-card.ts +27 -7
package/telegram-plugin/uat/SETUP.md +160 -0
package/telegram-plugin/uat/assertions.ts +140 -0
package/telegram-plugin/uat/driver.ts +174 -0
package/telegram-plugin/uat/harness.ts +161 -0
package/telegram-plugin/uat/login.ts +134 -0
package/telegram-plugin/uat/port-allocator.ts +71 -0
package/telegram-plugin/uat/scenarios/smoke-clerk-reply.test.ts +61 -0
package/telegram-plugin/welcome-text.ts +44 -2
package/bin/bridge-watchdog.sh +0 -967

package/README.md CHANGED Viewed

@@ -9,29 +9,19 @@
 [![Trigger evals](https://img.shields.io/endpoint?url=https%3A%2F%2Fgist.githubusercontent.com%2Fmekenthompson%2F002f3482b19111d35e57c1903b3733e2%2Fraw%2Fswitchroom-trigger-evals.json)](https://buildkite.com/ken-thompson/switchroom)
 [![Quality evals](https://img.shields.io/endpoint?url=https%3A%2F%2Fgist.githubusercontent.com%2Fmekenthompson%2F002f3482b19111d35e57c1903b3733e2%2Fraw%2Fswitchroom-quality-evals.json)](https://buildkite.com/ken-thompson/switchroom)
-**Your Claude Pro or Max, as a fleet of always-on agents in Telegram. Opinionated UX, done properly.**
+**A switchboard for your Pro or Max.** Your Claude subscription, as a fleet of always-on specialist agents you talk to from Telegram. Opinionated UX, done properly.
 > *I loved OpenClaw + Telegram. I wanted my Claude subscription. And the UX done properly. So I built this.*
-**Compliance-by-design.** Switchroom leverages Claude Code natively — unmodified `claude` CLI, no Agent SDK, no direct API. It sets up the CLI the way you would, then gets out of the way. See the [Compliance Attestation](docs/compliance-attestation.md) for detail.
+[Latest release notes →](CHANGELOG.md)
-## Right, so what's this about
+## See what your agent is doing
-So you had the bright idea. Run Claude Code agents 24/7 on a cheap Linux box, talk to them from Telegram, use the Claude Pro or Max subscription you're already paying for. Sensible. Obvious, even.
-Then you tried OpenClaw. Followed the docs, spun it up, got it running, only to realise halfway through that you're pinging the Anthropic API on your own key and your token bill is quietly ticking over in the background. Bit of a bait and switch, that one. You signed up for "use your subscription," not "buy API credits on top of your subscription."
-So you gave Claude Code's built-in Telegram channel a crack instead. Sent a message. Waited. Something happened, maybe. Eventually a reply came back. What did the agent actually do? No idea. Which tools ran? No idea. Did it get stuck, crash, spawn a sub-agent, read half your repo? No idea. It's an MVP black box of death, and I got sick of squinting into it.
-So I built this.
-## What Switchroom is, and isn't
-Switchroom is an opinionated implementation of a Telegram plugin and agent lifecycle layer, sitting on top of the official `claude` CLI. No fork. No custom runtime in Docker. No API key interception. Your Claude Pro or Max subscription does the work, the same way it does on your desktop, authenticated via the same OAuth flow, fully compliant with Anthropic's terms.
+Every time an agent starts work, a **progress card** pins into its Telegram topic and updates in place as tools execute. Each Read, Bash, Edit, Grep is visible as it happens, with elapsed time so you can tell if something's stuck. Sub-agents surface in the same card. When the agent finishes, the card flips to Done and unpins.
-It is not trying to be a general-purpose LLM orchestrator. It doesn't care about OpenAI, Gemini, Llama, or swapping model providers. It is not a multi-channel bridge for Slack, Discord, Teams. It does one thing: makes Telegram the best possible interaction surface for Claude Code. Unashamedly.
+No silent gaps. No ghosts. No squinting into a black box.
-The whole thing is built around one idea. Every time an agent starts work, a **progress card** pops into Telegram and stays pinned while the task runs. It updates in place as tools execute, so you see each Read, Bash, Edit, Grep happen as it happens.
+<p align="center"><img src="docs/diagrams/progress-card-anatomy.jpg" width="700" alt="Annotated progress card: pin badge, user quote, last 5 steps, collapsed older, in-flight pulse, elapsed timer, sub-agent indent"></p>
 ```
 ⚙️ Working… · ⏱ 12s
@@ -43,63 +33,114 @@ The whole thing is built around one idea. Every time an agent starts work, a **p
   🤖 Edit src/auth/jwt.ts · 4s
 ```
-When the agent finishes, the card flips to Done and unpins. Two agents working at the same time? Each gets its own card, labelled `(1/2)` and `(2/2)`, so you can follow both without losing the plot.
+The card is the headline UX. The rest of the product is in service of it.
+- Cards update at most once every 5 seconds. Fast enough to follow, not so fast it floods.
+- Last 5 steps stay visible. Older ones collapse into `(+N more earlier steps)`.
+- Running steps show elapsed time so a stuck tool is obvious.
+- Tool labels are deterministic, written by a `PreToolUse` hook, so the card never lies about what's running.
+- Two agents working at once? Each gets its own card, labelled `(1/2)` and `(2/2)`.
+### Sub-agent visibility
+When an agent delegates to a sub-agent — Opus plans, Sonnet implements — the sub-agent's work shows up indented inside the parent's pinned card. One pinned surface per task, however many processes it spawns underneath. Nothing gets buried in a side-channel you have to go look for.
-## The UX bits that matter
+### Right, so what's this about
-- Cards update at most once every 5 seconds. Fast enough to follow, not so fast it floods
-- Last 5 steps are always visible, older ones collapse into `(+N more earlier steps)`
-- Running steps show elapsed time so you can tell if something's stuck
-- Sub-agents get their own section in the card, so nested work is visible, not hidden
-- No silent gaps. No ghosts.
+So you had the bright idea. Run Claude Code agents 24/7 on a cheap Linux box, talk to them from Telegram, use the Claude Pro or Max subscription you're already paying for. Sensible. Obvious, even.
+Then you tried OpenClaw. Followed the docs, spun it up, got it running, only to realise halfway through that you're pinging the Anthropic API on your own key and your token bill is quietly ticking over in the background. Bit of a bait and switch, that one. You signed up for "use your subscription," not "buy API credits on top of your subscription."
+So you gave Claude Code's built-in Telegram channel a crack instead. Sent a message. Waited. Something happened, maybe. Eventually a reply came back. What did the agent actually do? No idea. Which tools ran? No idea. Did it get stuck, crash, spawn a sub-agent, read half your repo? No idea. It's an MVP black box of death, and I got sick of squinting into it.
+So I built this.
+## What you get
+| Feature | What it does |
+|---|---|
+| **Progress cards** | Pinned, in-place, every tool call visible. The headline UX. |
+| **Claude Pro/Max auth** | OAuth, not API keys. No per-token billing. Multi-account fallback pool per agent. |
+| **Approval kernel** | Inline allow/deny cards in Telegram for every gated tool. TTL'd grants, full audit trail. |
+| **Sub-agents** | Opus plans, Sonnet implements. Sub-agent work surfaces in the parent card. |
+| **Config cascade** | Defaults, then profiles, then per-agent YAML. Change one line, every agent updates. |
+| **Scheduled tasks** | Cron-syntax tasks that fire across reboots. Headless secret access via the vault broker. |
+| **Persistent memory** | Hindsight semantic memory with knowledge graphs and mental models. |
+| **Session continuity** | Resume across restarts with freshness gating and a wake-audit. |
+| **Encrypted vault** | AES-256-GCM for secrets. Optional auto-unlock keyed off `/etc/machine-id`. |
+| **Drive MCP** | Read Google Docs, Sheets, and Drive files inline. Per-agent OAuth, no shared key. |
+| **Card audit log** | Every progress-card edit appended to `card-events.jsonl` for retrospective debugging. |
+| **15 Telegram MCP tools** | Reply, stream replies, edit, pin, react, native checklists, sticker aliases, voice-in transcription, attachments, history. |
 ## Architecture
-One Claude Code REPL per agent, dressed up with systemd and a Telegram bot. Two systemd units per agent: the Claude process (`switchroom-<agent>.service`) and its Telegram gateway (`switchroom-<agent>-gateway.service`). See [`docs/architecture.md`](docs/architecture.md) for the process model, IPC layout, and how each layer maps to the `claude` CLI.
+One long-running service per agent. Each agent runs the stock `claude` CLI — not a fork, not the Agents SDK, not a wrapped harness — authenticated directly with Anthropic via official OAuth. Switchroom is scaffolding and lifecycle around the CLI you'd run by hand: a Telegram bot, an approval broker, a vault broker, and Docker Compose for supervision. See [`docs/architecture.md`](docs/architecture.md) for the process model and how each layer maps to the `claude` CLI.
 ```
 You (Telegram)
     │
     ▼
-@YourBot ──── switchroom-telegram MCP ──── Claude Code CLI
-                  │                        │
-                  ├─ Progress cards         ├─ .claude/agents/*.md (sub-agents)
-                  ├─ Pin / unpin lifecycle  ├─ settings.json (tools, hooks, MCP)
-                  ├─ SQLite history         ├─ Hindsight plugin (memory)
-                  ├─ Emoji reactions        └─ systemd (agent + cron timers)
-                  └─ Format conversion
+@YourBot ──┬── switchroom-telegram MCP ──┬── agent supervisor ─── Claude Code CLI
+           │       (15 tools)            │     (per-agent)        │
+           │                             │                        ├─ .claude/agents/*.md (sub-agents)
+           ├─ Progress cards             ├─ Approval kernel ◄─────┤   settings.json (tools, hooks, MCP)
+           ├─ Pin / unpin lifecycle      │   (allow/deny broker)  ├─ Hindsight plugin (memory)
+           ├─ SQLite history             ├─ Vault broker ◄────────┤   Drive MCP, Playwright MCP, …
+           ├─ Card-events.jsonl audit    │   (cron secrets, IPC)  └─ scheduled tasks across reboots
+           ├─ Emoji reactions            │
+           └─ Format conversion          └─ Docker Compose restart (unless-stopped)
 ```
-Switchroom is **not a harness**. Each agent runs the unmodified `claude` binary, authenticated directly with Anthropic via official OAuth. No credential interception, no API key routing.
+See [`docs/architecture.md`](docs/architecture.md) for the process model, IPC layout, supervisor choice, and how each layer maps to the `claude` CLI.
-## Everything else you get
+## Approvals & safety
-| Feature | What it does |
-|---------|-------------|
-| **Claude Pro/Max auth** | OAuth, not API keys. No per-token billing. |
-| **Multi-agent** | Opus plans, Sonnet implements in the background. Sub-agent work surfaces in the card. |
-| **Config cascade** | Defaults, then profiles, then per-agent YAML. Change one line, every agent updates. |
-| **Scheduled tasks** | Cron-based systemd timers. Survive reboots. |
-| **Persistent memory** | Hindsight semantic memory with knowledge graphs. |
-| **Session continuity** | Resume sessions across restarts with freshness gating. |
-| **Encrypted vault** | AES-256-GCM for secrets. |
-| **12 Telegram MCP tools** | Reply, stream replies, pin, react, history, attachments, native checklists, all of it. |
+Tools that touch the world — Bash, Edit, Write, anything not on an agent's pre-approved allowlist — pause for explicit approval. Switchroom's **approval kernel** (shipped in v0.5.1) routes every gated tool call through an inline Telegram card with the actual diff or command shown. Tap Allow and the tool resumes. Tap Deny and the agent gets a clean refusal it can recover from.
+<p align="center"><img src="docs/diagrams/approval-grant-flow.jpg" width="700" alt="Approval grant flow: agent tool call pauses at the kernel, broker writes pending grant to sqlite, user taps Allow on the Telegram card, broker releases the gate, tool resumes"></p>
+- **Inline cards.** Allow / Deny / Allow once / Allow for 1h. No leaving Telegram.
+- **TTL'd grants.** "Allow Bash for 1h" expires automatically. No silent permanent escalation.
+- **Audit trail.** Every grant, denial, and expiry written to a per-agent log you can replay.
+- **Per-agent allowlist.** `switchroom agent grant <name> <tool>` for the boring ones you don't want to be asked about.
+The kernel runs as an out-of-process broker over a unix socket. The agent process never decides its own permissions; it asks and waits.
+### Compliance posture
-## How it stacks up against the alternatives
+Switchroom never intercepts auth, never proxies inference, never patches the CLI. The `claude` binary you run is the one Anthropic ships. See the [Compliance Attestation](docs/compliance-attestation.md) for the full analysis against Anthropic's April 2026 third-party policy.
+## Survives real life
+Each agent is a long-running service. They survive reboots, network drops, and your laptop closing. But "always on" isn't enough on its own. Things still die. The product has to handle that gracefully or the illusion breaks.
+<p align="center"><img src="docs/diagrams/wake-audit-lifecycle.jpg" width="700" alt="Wake-audit lifecycle: kill, crash-pane snapshot, auto-restart, agent boots with SWITCHROOM_PENDING_TURN, acks with three options"></p>
+- **Auto-restart.** Agent containers come up with `restart: unless-stopped`, and each service has a healthcheck — a crashed or wedged agent is brought back automatically. No silently dropped work.
+- **Resume protocol.** When an agent reboots mid-turn, `start.sh` exports `SWITCHROOM_PENDING_TURN=true` plus the original chat / message ids. The agent's first action on boot is to acknowledge the gap and ask the user how to proceed (start over, summarise and continue, or drop it).
+- **Wake-audit.** On every fresh boot the agent checks for owed replies, orphan sub-agents, and stale in-progress todos. If everything's clean it stays quiet. If it owed you a reply, it tells you.
+- **Token refresh.** Token refresh runs unattended for weeks via a `refresh-tick` daemon. The multi-account fallback pool kicks in when the active slot hits its quota window.
+## How it stacks up
 | | Switchroom | Claude Code channels | OpenClaw | NanoClaw |
 |---|---|---|---|---|
-| Progress visibility | Live progress cards, pinned | None, black box | None | None |
+| Progress visibility | Live cards, pinned | Black box | None | None |
 | Runtime | Claude Code CLI | Claude Code CLI | Custom runtime | Agents SDK |
 | Auth | Pro/Max OAuth | Pro/Max OAuth | API key | API key |
-| Sub-agent tracking | Yes, visible in card | No | No | No |
+| Sub-agent tracking | Yes, in card | No | No | No |
 | Parallel task display | Labelled cards `(1/N)` | No | No | No |
+| Approval UX | Inline Telegram cards | None | None | None |
 | Config | YAML with cascade | None | JSON/TOML | Env vars |
 | Setup | `switchroom setup` | Built-in (limited) | Docker compose | Docker compose |
+The wedge against OpenClaw and NanoClaw isn't the substrate — it's the stock `claude` CLI under your subscription, instead of a custom runtime under your API key.
 ## Install
-Ubuntu 24.04 LTS, 4GB RAM. Linux only.
+Runs on the box you already have. The supported production runtime is Linux + Docker (Ubuntu 24.04 LTS with 4GB RAM is the canonical target; other Linux distros work with minor tweaks). `switchroom apply` scaffolds every agent and writes a `docker-compose.yml` from your `switchroom.yaml`; you bring the fleet up yourself with `docker compose -p switchroom -f ~/.switchroom/compose/docker-compose.yml up -d`. Five published images on GHCR (`switchroom-base`, `switchroom-agent`, `switchroom-broker`, `switchroom-kernel`, `switchroom-scheduler`) — no `docker build` on the operator's host. macOS (Docker Desktop) works for development but is not yet release-validated.
+> **Heads up on the package name.** The npm package was originally `switchroom-ai`. It's now just `switchroom`. The old name is deprecated and will stop receiving updates — `npm install -g switchroom` is the current path.
 ### From inside Claude Code (the on-ramp)
@@ -111,15 +152,32 @@ If you already use Claude Code, this is the shortest path. Inside any session:
 /switchroom:setup
 ```
-`/switchroom:setup` walks you through deps, `switchroom setup` (Telegram + vault + first agent), and `switchroom agent start`. Once it's done you have `/switchroom:start`, `/switchroom:stop`, and `/switchroom:status` for day-to-day. See [`docs/publishing.md`](docs/publishing.md).
+`/switchroom:setup` walks you through deps, `switchroom setup` (Telegram + vault + first agent), and `switchroom agent start`. Day-to-day: `/switchroom:start`, `/switchroom:stop`, `/switchroom:status`. See [`docs/publishing.md`](docs/publishing.md).
-### One-liner (fresh box)
+### One-liner (static binary)
 ```bash
-curl -fsSL https://get.switchroom.ai | bash
+curl -fsSL https://github.com/switchroom/switchroom/raw/main/install.sh | sh
 ```
-Bootstraps bun, node 22, the claude CLI, and switchroom. Idempotent. Safe to re-run. Source is [`install.sh`](install.sh) in this repo.
+Auto-detects your platform (linux / macos) and arch (amd64 / arm64), downloads the matching pre-built binary from the latest [GitHub release](https://github.com/switchroom/switchroom/releases/latest), verifies its SHA256, and drops it in `/usr/local/bin` (or `~/.local/bin` if not writable). Source is [`install.sh`](install.sh).
+The static binary still needs the `claude` CLI to run agents: `npm i -g @anthropic-ai/claude-code` (Node 20.11+).
+**Manual install** if you'd rather not pipe to sh:
+```bash
+# Pick the artifact for your platform/arch from the latest release page
+curl -fsSL -o switchroom https://github.com/switchroom/switchroom/releases/latest/download/switchroom-linux-amd64
+chmod +x switchroom
+sudo mv switchroom /usr/local/bin/
+```
+Replace `switchroom-linux-amd64` with `switchroom-linux-arm64`, `switchroom-macos-amd64`, or `switchroom-macos-arm64` as needed. Verify against `switchroom-checksums.txt` from the same release.
+**macOS Gatekeeper note.** Releases are not yet Apple-code-signed. After installing on macOS you may need to clear the quarantine xattr so the binary will run: `xattr -d com.apple.quarantine /usr/local/bin/switchroom`. The `install.sh` one-liner handles this automatically.
+**macOS Sequoia and later (one-time step).** macOS 15 adds a second-stage notarization check that stripping the quarantine `xattr` alone does not bypass — you may still see a Gatekeeper "cannot verify the developer" dialog the first time you run `switchroom`. `install.sh` attempts `sudo spctl --add /usr/local/bin/switchroom` automatically (best-effort, ignored if sudo isn't available). If the dialog still appears, run that `spctl --add` command manually, or open System Settings → Privacy & Security → "Open Anyway" once.
 Then:
@@ -127,7 +185,8 @@ Then:
 switchroom setup                                        # interactive Telegram wiring
 switchroom agent create coach --profile health-coach    # scaffold your first agent
 switchroom auth login coach                             # link your Pro or Max session
-switchroom agent start coach                            # go
+switchroom apply                                        # write docker-compose.yml
+docker compose -p switchroom -f ~/.switchroom/compose/docker-compose.yml up -d
 ```
 After the last command you talk to the agent from Telegram. You don't touch the server again.
@@ -139,7 +198,7 @@ npm install -g @anthropic-ai/claude-code switchroom
 switchroom setup
 ```
-Node 20.11+. `switchroom setup` is the interactive first-time wizard — scaffolds config, handles Telegram wiring, sets up the vault.
+Node 20.11+. `switchroom setup` is the interactive first-time wizard. Scaffolds config, handles Telegram wiring, sets up the vault.
 ### One-shot happy path (no wizard)
@@ -148,18 +207,18 @@ If you already have Telegram credentials in `~/.switchroom/switchroom.yaml`, ski
 ```bash
 switchroom agent create coach --profile health-coach
 switchroom auth login coach
-switchroom agent start coach
+switchroom apply && docker compose -p switchroom -f ~/.switchroom/compose/docker-compose.yml up -d
 ```
-## Example Configuration
+## Example configuration
 ```yaml
 switchroom:
   version: 1
 telegram:
+  # Per-agent bot token (DM-only by default).
   bot_token: "vault:telegram-bot-token"
-  forum_chat_id: "-1001234567890"
 memory:
   backend: hindsight
@@ -195,11 +254,7 @@ See [docs/configuration.md](docs/configuration.md) for the full reference.
 ## Vault broker (cron secrets)
-Scheduled tasks run headless via `systemd --user` timers, so they cannot prompt
-for the vault passphrase. The vault broker is a long-running user-level systemd
-unit that holds the vault decrypted in memory after a one-time interactive
-unlock. Cron tasks fetch the specific keys they declare via a unix socket; the
-passphrase never sits on disk.
+Scheduled tasks run headless inside the agent container, so they can't prompt for the vault passphrase. The vault broker is a long-running container (`switchroom-broker`) that holds the vault decrypted in memory after a one-time interactive unlock. Cron tasks fetch the specific keys they declare via a host-shared unix socket. The passphrase never sits on disk.
 **Declare per-cron secrets in `switchroom.yaml`:**
@@ -217,69 +272,39 @@ agents:
 **Bootstrap once per host:**
 ```bash
-switchroom update                       # installs the broker systemd unit
+switchroom apply                        # writes broker into docker-compose.yml
+docker compose -p switchroom -f ~/.switchroom/compose/docker-compose.yml up -d switchroom-broker
 switchroom vault broker unlock          # prompt for passphrase, primes broker
 ```
-Or just run `switchroom vault get <key>` from a TTY — the broker offers to
-take the unlocked state with `[Y/n]` so you don't have to remember a separate
-unlock command.
+Or just run `switchroom vault get <key>` from a TTY. The broker offers to take the unlocked state with `[Y/n]` so you don't have to remember a separate unlock command.
-**Identity model.** On Linux, the broker reads `/proc/<pid>/cgroup` to find
-the connecting cron's systemd unit (`switchroom-<agent>-cron-<i>.service`).
-Cgroup membership is set by systemd as root and is unspoofable from
-userspace, so a compromised agent cannot pose as another agent's cron and
-read its keys. macOS and other platforms degrade to UID-only via the socket
-file mode 0600 — fine for desktop use, not recommended for production cron.
+**Identity model.** The broker reads `/proc/<pid>/cgroup` on the host to find the connecting cron's container (`switchroom-<agent>-scheduler` or `switchroom-<agent>`). Cgroup membership is set by Docker and cannot be spoofed from userspace, so a compromised agent cannot pose as another agent's cron and read its keys. macOS (Docker Desktop) degrades to UID-only via the socket file mode 0600. That is fine for desktop use, but not recommended for production cron.
-The broker locks on `SIGTERM` (so a `restart` zeros the in-memory state)
-and on demand via `switchroom vault broker lock`. Use
-`switchroom vault get <key> --no-broker` to bypass and prompt locally.
+The broker locks on `SIGTERM` (so a container restart zeros the in-memory state) and on demand via `switchroom vault broker lock`. Use `switchroom vault get <key> --no-broker` to bypass and prompt locally.
-Unit installed at `~/.config/systemd/user/switchroom-vault-broker.service`.
+Broker socket lives at `~/.switchroom/vault-broker.sock` (host-mounted into every agent container).
 ### Auto-unlock on boot (opt-in)
-By default, the broker holds the unlocked state in memory only — every
-restart (host reboot, service crash, reconcile that re-renders the unit)
-wipes it and requires `switchroom vault broker unlock` again. For
-unattended hosts where this is too painful, switchroom can encrypt the
-passphrase with a key derived from `/etc/machine-id` and have the broker
-unlock itself at boot:
+By default, the broker holds the unlocked state in memory only. Every restart (host reboot, service crash, reconcile that re-renders the unit) wipes it and requires `switchroom vault broker unlock` again. For unattended hosts where this is too painful, switchroom can encrypt the passphrase with a key derived from `/etc/machine-id` and have the broker unlock itself at boot:
 ```bash
 switchroom vault broker enable-auto-unlock   # one-time setup, prompts for passphrase
 ```
-Done. The wizard prompts for your vault passphrase, encrypts it with
-AES-256-GCM keyed off `/etc/machine-id`, writes the result to
-`~/.config/switchroom/auto-unlock.bin` (mode 0600), flips
-`vault.broker.autoUnlock: true` in `switchroom.yaml`, restarts the
-broker, and verifies the vault came up unlocked. Every subsequent boot
-the broker reads + decrypts + unlocks itself.
+Done. The wizard prompts for your vault passphrase, encrypts it with AES-256-GCM keyed off `/etc/machine-id`, writes the result to `~/.switchroom/vault-auto-unlock` (mode 0600), flips `vault.broker.autoUnlock: true` in `switchroom.yaml`, restarts the broker, and verifies the vault came up unlocked. On every subsequent boot the broker reads the blob, decrypts it, and unlocks itself.
 Disable with `switchroom vault broker disable-auto-unlock`.
-**Security tradeoff — read this before enabling.** The encrypted blob
-lives at mode 0600 in your home directory; the encryption key is
-derived from `/etc/machine-id` plus a per-file random salt. This means
-disk theft is safe (the blob doesn't decrypt on any other machine) and
-other UNIX users on the same box can't read it — but root on the host
-*can* read both the blob and the machine-id, so once root is on the
-machine the passphrase is recoverable. Same blast radius as the
-running broker process (anything with code-exec as you can already
-attach to the broker socket and exfiltrate secrets), but it shifts the
-convenience-vs-security knob: auto-unlock means a lost laptop is a lost
-vault even if the vault file itself is encrypted at rest. Use only on
-hosts you trust. See [docs/auto-unlock.md](docs/auto-unlock.md) for the
-full threat model and recovery instructions.
-## CLI Reference
+**Security tradeoff. Read this before enabling.** The encrypted blob lives at mode 0600 in your home directory; the encryption key is derived from `/etc/machine-id` plus a per-file random salt. Disk theft is safe (the blob doesn't decrypt on any other machine) and other UNIX users on the same box can't read it. But root on the host *can* read both the blob and the machine-id, so once root is on the machine the passphrase is recoverable. That is the same blast radius as the running broker process (anything with code execution as your user can already attach to the broker socket and exfiltrate secrets), but it shifts the convenience-vs-security knob: auto-unlock means a lost laptop is a lost vault even if the vault file itself is encrypted at rest. Use only on hosts you trust. See [docs/auto-unlock.md](docs/auto-unlock.md) for the full threat model and recovery instructions.
+## CLI reference
 ```bash
 switchroom setup                              # Interactive wizard
 switchroom doctor                             # Health check
-switchroom update                             # Pull latest + rebuild + reconcile + restart
+switchroom apply                              # Reconcile + (re)write docker-compose.yml; bring fleet up via `docker compose ... up -d`
 switchroom restart [agent] [--force]          # Bounce agent(s); drains in-flight turn by default
 switchroom version                            # Show versions + running agent health summary
@@ -292,7 +317,7 @@ switchroom agent reconcile <name|all>         # Re-apply switchroom.yaml (withou
 switchroom agent start|stop|restart <name>    # Lifecycle (with preflight)
 switchroom agent interrupt <name>             # Cancel in-flight turn without restarting
 switchroom agent rename <old> <new>           # Rename an agent slug (#168)
-switchroom agent destroy <name>               # Tear down systemd units + scaffold dir
+switchroom agent destroy <name>               # Remove from compose + scaffold dir
 switchroom agent attach <name>                # Interactive tmux session
 switchroom agent logs <name> [-f]             # View logs
 switchroom agent grant <name> <tool>          # Grant a tool permission
@@ -305,7 +330,7 @@ Profiles live in `profiles/` at the repo root. Bundled ones for `--profile`: `co
 `switchroom agent create <name> --profile <profile>` does two things in one step:
 1. Adds an entry to `switchroom.yaml` under `agents:` with `extends: <profile>` and a derived `topic_name` (capitalized agent name). Edit the yaml afterwards to change the topic name, emoji, tools, etc.
-2. Scaffolds the agent directory and installs the systemd unit (same as running `agent create` on an entry that already exists in yaml).
+2. Scaffolds the agent directory; the agent is then registered in `docker-compose.yml` on the next `switchroom apply` (same as running `agent create` on an entry that already exists in yaml).
 If the agent is already in yaml, `--profile` must match the existing `extends:` value or it errors. If the yaml entry has no `extends:` and you pass `--profile`, the flag is written in additively with a warning. Running `agent create` with no `--profile` on a missing entry keeps the old "Agent not defined in switchroom.yaml" error, now with a hint to use `--profile`.
@@ -313,10 +338,7 @@ Model aliases: the bare names `opus`, `sonnet`, `haiku` are accepted alongside t
 ### Authentication (multi-account slot pool)
-Each agent has a pool of Claude OAuth slots. The **active** slot is what
-the agent uses; other slots are automatic fallbacks when the active slot
-hits its quota window. Every `<slot>` option defaults to the active slot
-if omitted.
+Each agent has a pool of Claude OAuth slots. The **active** slot is what the agent uses; other slots are automatic fallbacks when the active slot hits its quota window. Every `<slot>` option defaults to the active slot if omitted.
 ```bash
 switchroom auth status                            # All agents, one table
@@ -333,15 +355,11 @@ switchroom auth list <agent> [--json]             # Show slots: health, quota st
 switchroom auth rm <agent> <slot> [--force]       # Remove a slot (refuses active/last slot)
 ```
-The fallback pool also works from Telegram. The switchroom MCP plugin
-exposes the same verbs as `/auth add|use|list|rm` inside the chat.
+The fallback pool also works from Telegram. The switchroom MCP plugin exposes the same verbs as `/auth add|use|list|rm` inside the chat.
 ### Workspace (agent bootstrap layer)
-Each agent has a workspace directory (`~/.switchroom/agents/<name>/workspace/`)
-with editable stable files (`AGENTS.md`, `SOUL.md`, `USER.md`, `IDENTITY.md`,
-`TOOLS.md`) and dynamic files (`MEMORY.md`, `memory/YYYY-MM-DD.md`,
-`HEARTBEAT.md`) that are injected into the model's context at turn time.
+Each agent has a workspace directory (`~/.switchroom/agents/<name>/workspace/`) with editable stable files (`AGENTS.md`, `SOUL.md`, `USER.md`, `IDENTITY.md`, `TOOLS.md`) and dynamic files (`MEMORY.md`, `memory/YYYY-MM-DD.md`, `HEARTBEAT.md`) that are injected into the model's context at turn time.
 ```bash
 switchroom workspace path <agent>                 # Print the workspace dir
@@ -361,6 +379,8 @@ switchroom debug turn <agent>                     # Dump the exact prompt layeri
 switchroom memory setup|search|stats|reflect      # Hindsight memory
 ```
+The progress card driver also writes a per-agent `card-events.jsonl` audit log: every edit, pin, unpin, and tool-label transition the user sees in Telegram, captured locally so a debug session doesn't depend on Telegram's history. Tail it like any other journal.
 ### Other
 ```bash
@@ -374,7 +394,7 @@ switchroom web                                    # Web dashboard
 `scripts/import-openclaw-credentials.ts` is a one-shot migration script that lifts `/data/openclaw-config/credentials/` into the Switchroom vault. It ships with a small set of default mappings for filenames OpenClaw documents out of the box.
-User-specific credential filenames (your custom bot tokens, SSH keys, and so on) belong in a local overlay file — not in the source repository. Create `~/.switchroom/import-openclaw.yaml`:
+User-specific credential filenames (your custom bot tokens, SSH keys, and so on) belong in a local overlay file, not the source repository. Create `~/.switchroom/import-openclaw.yaml`:
 ```yaml
 # ~/.switchroom/import-openclaw.yaml
@@ -395,12 +415,13 @@ Overlay entries win on collision with built-in defaults. Unknown files that appe
 ## Documentation
 | Guide | Description |
-|-------|-------------|
+|---|---|
+| **[Changelog](CHANGELOG.md)** | Release notes, every version |
 | **[Configuration](docs/configuration.md)** | Full field reference, cascade semantics, profiles |
 | **[Vault](docs/vault.md)** | Architecture, per-cron secrets, ACL, audit log, threat model |
-| **[Telegram Plugin](docs/telegram-plugin.md)** | Progress cards, 10 MCP tools, emoji reactions |
+| **[Telegram Plugin](docs/telegram-plugin.md)** | Progress cards, 15 MCP tools, native checklists, sticker aliases, voice-in |
 | **[Sub-Agents](docs/sub-agents.md)** | Model routing, delegation patterns, frontmatter spec |
-| **[Scheduling](docs/scheduling.md)** | Cron tasks, systemd timers, model selection |
+| **[Scheduling](docs/scheduling.md)** | Cron tasks (per-agent scheduler container), model selection |
 | **[Session Management](docs/session-optimization.md)** | Continuity, compaction, freshness policy |
 | **[OpenClaw alternative](docs/vs-openclaw.md)** | Switchroom vs OpenClaw |
 | **[NanoClaw alternative](docs/vs-nanoclaw.md)** | Switchroom vs NanoClaw |
@@ -409,7 +430,7 @@ Overlay entries win on collision with built-in defaults. Unknown files that appe
 ## Telemetry
-Switchroom reports anonymous usage events and errors to PostHog so we can spot regressions and understand which commands are used. **No personal data, code, or message content leaves your machine.** The anonymous ID lives at `~/.switchroom/analytics-id` and is a random UUID. Not tied to your username, email, IP, or machine identifier (we pass `disableGeoip: true` on every event).
+Switchroom reports anonymous usage events and errors to PostHog so I can spot regressions and understand which commands are used. **No personal data, code, or message content leaves your machine.** The anonymous ID lives at `~/.switchroom/analytics-id` and is a random UUID. It is not tied to your username, email, IP, or machine identifier (every event is sent with `disableGeoip: true`).
 To opt out, set this in your shell profile:
@@ -431,7 +452,7 @@ The built-in channel is message in, message out, with zero visibility into what
 Yes. Each agent gets its own Telegram forum topic. When multiple agents are working simultaneously, each has its own pinned progress card labelled `(1/N)`, `(2/N)` and so on.
 **Can I see what sub-agents are doing?**
-Yes. When an agent delegates to a sub-agent (a worker, a researcher), the sub-agent's activity shows up in its own section of the progress card. You see the full hierarchy, not just the top-level agent.
+Yes. When an agent delegates to a sub-agent (a worker, a researcher), the sub-agent's activity shows up in its own indented section of the parent's progress card. You see the full hierarchy, not just the top-level agent.
 **What does it cost to run?**
 A cheap Linux VPS (around $6/mo on Hetzner, DigitalOcean, wherever), plus your existing Claude Pro ($20/mo) or Max ($100/mo) subscription. Switchroom itself is MIT-licensed, free.

package/bin/autoaccept.exp CHANGED Viewed

@@ -34,13 +34,36 @@ expect {
         # spawned shell. Without this the loop hangs forever and expect
         # owns stdin, dropping any injected keystrokes.
     }
+    -re {Loading.{1,30}development.{1,30}channels} {
+        # NEW dev-channels prompt wording (Claude Code mid-2026+):
+        #   WARNING: Loading development channels
+        #   ❯ 1. I am using this for local development
+        #     2. Exit
+        # Option 1 ("local development") is already highlighted, so just
+        # press Enter — no Down keystroke needed. Tightly scoped to the
+        # literal "Loading … development channels" warning header so we
+        # don't over-match anywhere else.
+        sleep 0.5
+        send "\r"
+        exp_continue
+    }
+    -re {using this for local development} {
+        # Belt-and-suspenders for the new prompt: match on the option-row
+        # text in case the WARNING header has scrolled out of the capture
+        # window. Same scoping discipline — "local development" is unique
+        # to this prompt and won't appear in per-tool confirmations.
+        sleep 0.5
+        send "\r"
+        exp_continue
+    }
     -re {I.{0,5}accept.{0,80}development.{0,10}channels} {
-        # Dev-channels acknowledgement — shown once per machine when
-        # --dangerously-load-development-channels is first used. Tightly
-        # scoped to the literal "development channels" phrase to avoid
-        # over-matching per-tool confirmations that start with "Yes, I
-        # accept" e.g. "Yes, I accept this file edit." Those must fall
-        # through to the plugin's permission_request flow.
+        # LEGACY dev-channels acknowledgement — old wording before the
+        # 2026 TUI rename ("Yes, I accept the use of development channels").
+        # Kept as a fallback for older Claude Code releases. Tightly scoped
+        # to the literal "development channels" phrase to avoid over-matching
+        # per-tool confirmations that start with "Yes, I accept" e.g.
+        # "Yes, I accept this file edit." Those must fall through to the
+        # plugin's permission_request flow.
         sleep 0.5
         send "\033\[B\r"
         exp_continue