npm - switchroom - Versions diffs - 0.7.15 → 0.10.0 - Mend

switchroom 0.7.15 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (301) hide show

package/README.md +51 -59
package/bin/run-hook.sh +27 -11
package/bin/timezone-hook.sh +9 -7
package/dist/agent-scheduler/index.js +410 -133
package/dist/auth-broker/index.js +13932 -0
package/dist/cli/switchroom.js +26937 -5601
package/dist/host-control/main.js +12702 -0
package/dist/vault/approvals/kernel-server.js +467 -184
package/dist/vault/broker/server.js +1430 -724
package/examples/minimal.yaml +63 -0
package/examples/personal-google-workspace-mcp/.env.example +34 -0
package/examples/personal-google-workspace-mcp/README.md +194 -0
package/examples/personal-google-workspace-mcp/compose.yaml +66 -0
package/examples/switchroom.yaml +220 -0
package/package.json +7 -4
package/profiles/_base/settings.json.hbs +20 -5
package/profiles/_base/start.sh.hbs +16 -3
package/profiles/_shared/agent-self-service.md.hbs +126 -0
package/profiles/_shared/telegram-style.md.hbs +20 -90
package/profiles/_shared/vault-protocol.md.hbs +68 -0
package/profiles/default/CLAUDE.md +50 -96
package/profiles/default/CLAUDE.md.hbs +36 -6
package/profiles/default/workspace/SOUL.md.hbs +12 -5
package/skills/buildkite-agent-infrastructure/SKILL.md +30 -11
package/skills/buildkite-agent-runtime/SKILL.md +44 -11
package/skills/buildkite-api/SKILL.md +31 -8
package/skills/buildkite-cli/SKILL.md +27 -9
package/skills/buildkite-migration/SKILL.md +22 -9
package/skills/buildkite-pipelines/SKILL.md +26 -9
package/skills/buildkite-secure-delivery/SKILL.md +23 -9
package/skills/buildkite-test-engine/SKILL.md +25 -8
package/skills/docx/SKILL.md +1 -1
package/skills/docx/scripts/office/validators/__pycache__/__init__.cpython-313.pyc +0 -0
package/skills/docx/scripts/office/validators/__pycache__/base.cpython-313.pyc +0 -0
package/skills/file-bug/SKILL.md +34 -6
package/skills/humanizer/SKILL.md +15 -0
package/skills/humanizer-calibrate/SKILL.md +7 -1
package/skills/mcp-builder/SKILL.md +1 -1
package/skills/pdf/SKILL.md +1 -1
package/skills/pptx/SKILL.md +1 -1
package/skills/skill-creator/SKILL.md +21 -1
package/skills/skill-creator/scripts/__pycache__/__init__.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/generate_report.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/improve_description.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_eval.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/run_loop.cpython-313.pyc +0 -0
package/skills/skill-creator/scripts/__pycache__/utils.cpython-313.pyc +0 -0
package/skills/switchroom-cli/SKILL.md +63 -64
package/skills/switchroom-health/SKILL.md +23 -10
package/skills/switchroom-install/SKILL.md +3 -3
package/skills/switchroom-manage/SKILL.md +26 -19
package/skills/switchroom-runtime/SKILL.md +191 -0
package/skills/switchroom-status/SKILL.md +27 -2
package/skills/telegram-test-harness/SKILL.md +3 -0
package/skills/token-helpers/SKILL.md +24 -1
package/skills/webapp-testing/SKILL.md +31 -1
package/skills/xlsx/SKILL.md +1 -1
package/telegram-plugin/admin-commands/index.ts +7 -5
package/telegram-plugin/analytics-posthog.ts +191 -0
package/telegram-plugin/bridge/bridge.ts +69 -0
package/telegram-plugin/bridge/ipc-client.ts +4 -1
package/telegram-plugin/dist/bridge/bridge.js +194 -119
package/telegram-plugin/dist/gateway/gateway.js +23611 -19671
package/telegram-plugin/dist/server.js +245 -189
package/telegram-plugin/first-paint.ts +3 -24
package/telegram-plugin/gateway/auth-add-flow.ts +326 -0
package/telegram-plugin/gateway/auth-broker-client.ts +75 -0
package/telegram-plugin/gateway/auth-command.ts +794 -0
package/telegram-plugin/gateway/auth-line.ts +123 -0
package/telegram-plugin/gateway/boot-card.ts +169 -40
package/telegram-plugin/gateway/boot-issue-cache.ts +308 -0
package/telegram-plugin/gateway/boot-probes.ts +166 -123
package/telegram-plugin/gateway/boot-reason.ts +41 -7
package/telegram-plugin/gateway/boot-version.ts +66 -0
package/telegram-plugin/gateway/gateway.ts +3499 -1885
package/telegram-plugin/gateway/hostd-dispatch.ts +117 -0
package/telegram-plugin/gateway/ipc-protocol.ts +18 -0
package/telegram-plugin/gateway/pending-inbound-buffer.ts +106 -0
package/telegram-plugin/gateway/quarantine.ts +69 -0
package/telegram-plugin/gateway/quota-cache.ts +9 -4
package/telegram-plugin/gateway/reaction-trigger.ts +401 -0
package/telegram-plugin/gateway/recent-denials.test.ts +103 -0
package/telegram-plugin/gateway/recent-denials.ts +77 -0
package/telegram-plugin/gateway/startup-network-retry.ts +109 -31
package/telegram-plugin/gateway/vault-grant-inbound-builders.ts +125 -0
package/telegram-plugin/history.ts +91 -0
package/telegram-plugin/hooks/hooks.json +10 -0
package/telegram-plugin/hooks/sandbox-hint-posttool.mjs +130 -0
package/telegram-plugin/hooks/subagent-tracker-posttool.mjs +19 -2
package/telegram-plugin/hooks/subagent-tracker-pretool.mjs +22 -2
package/telegram-plugin/hooks/tool-label-pretool.mjs +11 -0
package/telegram-plugin/hooks/wedge-detect-posttool.mjs +303 -0
package/telegram-plugin/inbound-classifier.ts +50 -0
package/telegram-plugin/inline-keyboard-callbacks.ts +136 -0
package/telegram-plugin/node_modules/.vite/vitest/da39a3ee5e6b4b0d3255bfef95601890afd80709/results.json +1 -0
package/telegram-plugin/package.json +4 -2
package/telegram-plugin/permission-rule.ts +51 -0
package/telegram-plugin/permission-title.ts +56 -0
package/telegram-plugin/quota-check.ts +19 -41
package/telegram-plugin/registry/reaper.ts +223 -0
package/telegram-plugin/retry-api-call.ts +80 -0
package/telegram-plugin/runtime-metrics.ts +177 -0
package/telegram-plugin/scripts/build.mjs +0 -1
package/telegram-plugin/secret-detect/index.ts +24 -0
package/telegram-plugin/secret-detect/vault-error.test.ts +64 -12
package/telegram-plugin/secret-detect/vault-error.ts +78 -11
package/telegram-plugin/secret-detect/vault-write.ts +14 -2
package/telegram-plugin/server.js +41795 -0
package/telegram-plugin/session-tail.ts +6 -1
package/telegram-plugin/shared/bot-runtime.ts +5 -4
package/telegram-plugin/silence-poke.ts +420 -0
package/telegram-plugin/silent-end.ts +174 -0
package/telegram-plugin/stream-controller.ts +13 -0
package/telegram-plugin/stream-reply-handler.ts +7 -0
package/telegram-plugin/subagent-watcher.ts +213 -4
package/telegram-plugin/tests/auth-add-flow.test.ts +559 -0
package/telegram-plugin/tests/auth-code-redact.test.ts +8 -4
package/telegram-plugin/tests/auth-command-vernacular.test.ts +531 -0
package/telegram-plugin/tests/boot-card-issue-dedup.test.ts +247 -0
package/telegram-plugin/tests/boot-card-reason-to-render.test.ts +182 -0
package/telegram-plugin/tests/boot-card-reason.test.ts +65 -2
package/telegram-plugin/tests/boot-card-render.test.ts +146 -0
package/telegram-plugin/tests/boot-card-silent-on-operator.test.ts +103 -0
package/telegram-plugin/tests/boot-probes.test.ts +216 -10
package/telegram-plugin/tests/boot-version-string.test.ts +0 -0
package/telegram-plugin/tests/finalize-callback.test.ts +190 -0
package/telegram-plugin/tests/gateway-message-validator.test.ts +26 -0
package/telegram-plugin/tests/gateway-secret-detect.test.ts +12 -3
package/telegram-plugin/tests/gateway-startup-network-retry.test.ts +104 -0
package/telegram-plugin/tests/history-reaper.test.ts +378 -0
package/telegram-plugin/tests/hostd-dispatch.test.ts +129 -0
package/telegram-plugin/tests/inbound-classifier.test.ts +76 -0
package/telegram-plugin/tests/inbound-message-types.test.ts +267 -0
package/telegram-plugin/tests/issues-card.test.ts +49 -0
package/telegram-plugin/tests/pending-inbound-buffer.test.ts +132 -0
package/telegram-plugin/tests/permission-rule.test.ts +80 -1
package/telegram-plugin/tests/permission-title.test.ts +31 -0
package/telegram-plugin/tests/quota-check.test.ts +5 -35
package/telegram-plugin/tests/races.test.ts +179 -0
package/telegram-plugin/tests/reaction-trigger-flow.test.ts +353 -0
package/telegram-plugin/tests/reaction-trigger.test.ts +397 -0
package/telegram-plugin/tests/retry-api-call.test.ts +152 -1
package/telegram-plugin/tests/runtime-metrics.test.ts +145 -0
package/telegram-plugin/tests/sandbox-hint-posttool.test.ts +155 -0
package/telegram-plugin/tests/secret-detect-delete-must-surface-failures.test.ts +133 -0
package/telegram-plugin/tests/secret-detect-false-positives.test.ts +137 -0
package/telegram-plugin/tests/silence-poke.test.ts +493 -0
package/telegram-plugin/tests/silent-end.test.ts +206 -0
package/telegram-plugin/tests/subagent-tracker-hooks.test.ts +107 -0
package/telegram-plugin/tests/subagent-watcher-env-thresholds.test.ts +224 -0
package/telegram-plugin/tests/subagent-watcher-stall-terminal.test.ts +316 -0
package/telegram-plugin/tests/subagent-watcher.test.ts +263 -0
package/telegram-plugin/tests/turn-signal-tracker.test.ts +81 -0
package/telegram-plugin/tests/vault-approval-posture.test.ts +256 -0
package/telegram-plugin/tests/vault-grant-auto-resume.test.ts +73 -0
package/telegram-plugin/tests/vault-grant-inbound-builders.test.ts +226 -0
package/telegram-plugin/tests/vault-grant-union.test.ts +130 -0
package/telegram-plugin/tests/vault-key-regex-allows-slash.test.ts +140 -0
package/telegram-plugin/tests/vault-posture-quarantine.test.ts +104 -0
package/telegram-plugin/tests/vault-request-access-tool.test.ts +114 -0
package/telegram-plugin/tests/vault-request-access-unlock-resume.test.ts +106 -0
package/telegram-plugin/turn-signal-tracker.ts +100 -24
package/telegram-plugin/uat/SETUP.md +210 -35
package/telegram-plugin/uat/assertions.ts +264 -37
package/telegram-plugin/uat/driver-info.ts +57 -0
package/telegram-plugin/uat/driver.ts +590 -51
package/telegram-plugin/uat/harness.ts +140 -94
package/telegram-plugin/uat/load-env.test.ts +72 -0
package/telegram-plugin/uat/load-env.ts +48 -0
package/telegram-plugin/uat/login.ts +96 -53
package/telegram-plugin/uat/runners/agent-self-sufficiency.ts +457 -0
package/telegram-plugin/uat/runners/paraphrases.ts +231 -0
package/telegram-plugin/uat/runners/report.ts +150 -0
package/telegram-plugin/uat/runners/run-agent-self-sufficiency.sh +50 -0
package/telegram-plugin/uat/runners/scorer.test.ts +196 -0
package/telegram-plugin/uat/runners/scorer.ts +106 -0
package/telegram-plugin/uat/runners/skill-coverage.test.ts +100 -0
package/telegram-plugin/uat/runners/skill-coverage.ts +620 -0
package/telegram-plugin/uat/scenarios/ask-user-button-tap-dm.test.ts +141 -0
package/telegram-plugin/uat/scenarios/bg-sub-agent-dispatch-dm.test.ts +191 -0
package/telegram-plugin/uat/scenarios/fuzz-extended-dm.test.ts +255 -0
package/telegram-plugin/uat/scenarios/fuzz-human-style-dm.test.ts +275 -0
package/telegram-plugin/uat/scenarios/fuzz-random-prompts-dm.test.ts +146 -0
package/telegram-plugin/uat/scenarios/fuzz-status-ask-dm.test.ts +486 -0
package/telegram-plugin/uat/scenarios/jtbd-interrupt-marker-dm.test.ts +67 -0
package/telegram-plugin/uat/scenarios/jtbd-rapid-followup-dm.test.ts +100 -0
package/telegram-plugin/uat/scenarios/jtbd-soft-commit-dm.test.ts +67 -0
package/telegram-plugin/uat/scenarios/jtbd-status-query-dm.test.ts +49 -0
package/telegram-plugin/uat/scenarios/location-inbound-dm.test.ts +65 -0
package/telegram-plugin/uat/scenarios/midturn-silent-dm.test.ts +175 -0
package/telegram-plugin/uat/scenarios/reactions-dm.test.ts +142 -0
package/telegram-plugin/uat/scenarios/reactions-trigger-turn-dm.test.ts +96 -0
package/telegram-plugin/uat/scenarios/secret-redaction-deletes-original-dm.test.ts +123 -0
package/telegram-plugin/uat/scenarios/secret-redaction-no-false-positive-dm.test.ts +87 -0
package/telegram-plugin/uat/scenarios/silence-poke-soft-dm.test.ts +155 -0
package/telegram-plugin/uat/scenarios/silent-end-recovery-dm.test.ts +95 -0
package/telegram-plugin/uat/scenarios/smoke-dm-reply.test.ts +57 -0
package/telegram-plugin/uat/scenarios/subagent-watcher-no-rerun-dm.test.ts +135 -0
package/telegram-plugin/uat/scenarios/vault-approval-posture-telegram-id-dm.test.ts +191 -0
package/telegram-plugin/uat/scenarios/vault-audit-allow-dm.test.ts +108 -0
package/telegram-plugin/uat/scenarios/vault-grant-auto-resume-dm.test.ts +121 -0
package/telegram-plugin/uat/scenarios/vault-request-access-concurrent-dm.test.ts +161 -0
package/telegram-plugin/uat/scenarios/vault-request-access-end-to-end-dm.test.ts +158 -0
package/telegram-plugin/uat/scenarios/voice-inbound-dm.test.ts +65 -0
package/telegram-plugin/vault-approval-posture.ts +42 -0
package/telegram-plugin/welcome-text.ts +1 -0
package/telegram-plugin/active-pins-sweep.ts +0 -204
package/telegram-plugin/active-pins.ts +0 -146
package/telegram-plugin/auth-dashboard.ts +0 -1104
package/telegram-plugin/auth-slot-parser.ts +0 -497
package/telegram-plugin/card-event-log.ts +0 -138
package/telegram-plugin/dist/foreman/foreman.js +0 -31106
package/telegram-plugin/docs/multi-agent-card-design.md +0 -847
package/telegram-plugin/docs/pinned-progress-card-reliability.md +0 -144
package/telegram-plugin/foreman/foreman-create-flow.ts +0 -202
package/telegram-plugin/foreman/foreman-handlers.ts +0 -493
package/telegram-plugin/foreman/foreman.ts +0 -1165
package/telegram-plugin/foreman/setup-flow.ts +0 -345
package/telegram-plugin/foreman/setup-state.ts +0 -239
package/telegram-plugin/foreman/state.ts +0 -203
package/telegram-plugin/pin-event-log.ts +0 -76
package/telegram-plugin/progress-card-driver.ts +0 -2886
package/telegram-plugin/progress-card-pin-manager.ts +0 -589
package/telegram-plugin/progress-card-pin-watchdog.ts +0 -98
package/telegram-plugin/progress-card.ts +0 -1409
package/telegram-plugin/tests/HARNESS.md +0 -340
package/telegram-plugin/tests/_progress-card-harness.ts +0 -109
package/telegram-plugin/tests/active-pins-boot-reaper.test.ts +0 -211
package/telegram-plugin/tests/active-pins-sweep.test.ts +0 -309
package/telegram-plugin/tests/active-pins.test.ts +0 -187
package/telegram-plugin/tests/auth-account-identity-surface.test.ts +0 -118
package/telegram-plugin/tests/auth-dashboard-edge-cases.test.ts +0 -260
package/telegram-plugin/tests/auth-dashboard-restart-flow.test.ts +0 -140
package/telegram-plugin/tests/auth-dashboard-v3b.test.ts +0 -559
package/telegram-plugin/tests/auth-dashboard.test.ts +0 -1045
package/telegram-plugin/tests/auth-slot-commands.test.ts +0 -640
package/telegram-plugin/tests/bg-agent-progress-card-757.test.ts +0 -201
package/telegram-plugin/tests/boot-card-account-quota.test.ts +0 -137
package/telegram-plugin/tests/card-event-log.test.ts +0 -145
package/telegram-plugin/tests/first-paint.test.ts +0 -257
package/telegram-plugin/tests/foreman-create-flow.test.ts +0 -359
package/telegram-plugin/tests/foreman-handlers.test.ts +0 -347
package/telegram-plugin/tests/foreman-state.test.ts +0 -164
package/telegram-plugin/tests/foreman-write-ops.test.ts +0 -214
package/telegram-plugin/tests/harness-ordering-invariants.test.ts +0 -243
package/telegram-plugin/tests/pin-event-log.test.ts +0 -124
package/telegram-plugin/tests/progress-card-api-failure-during-deferred.test.ts +0 -73
package/telegram-plugin/tests/progress-card-close-paths-converge.test.ts +0 -272
package/telegram-plugin/tests/progress-card-cross-turn.test.ts +0 -258
package/telegram-plugin/tests/progress-card-delay-842.test.ts +0 -160
package/telegram-plugin/tests/progress-card-dispose-preservepending.test.ts +0 -81
package/telegram-plugin/tests/progress-card-draft-flag.test.ts +0 -80
package/telegram-plugin/tests/progress-card-driver-eviction.test.ts +0 -215
package/telegram-plugin/tests/progress-card-driver-fleet-shadow.test.ts +0 -123
package/telegram-plugin/tests/progress-card-driver-force-complete-parent-done.test.ts +0 -76
package/telegram-plugin/tests/progress-card-edit-timestamps-budget.test.ts +0 -62
package/telegram-plugin/tests/progress-card-memory-bounds.test.ts +0 -84
package/telegram-plugin/tests/progress-card-pin-failure-paths.test.ts +0 -139
package/telegram-plugin/tests/progress-card-pin-manager.test.ts +0 -773
package/telegram-plugin/tests/progress-card-pin-race-fast-turn.test.ts +0 -66
package/telegram-plugin/tests/progress-card-pin-sidecar-partial-write.test.ts +0 -64
package/telegram-plugin/tests/progress-card-pin-watchdog.test.ts +0 -190
package/telegram-plugin/tests/progress-card-sigterm-pin-flush.test.ts +0 -146
package/telegram-plugin/tests/real-gateway-f1-ladder-integrity.test.ts +0 -123
package/telegram-plugin/tests/real-gateway-f2-instant-draft.test.ts +0 -82
package/telegram-plugin/tests/real-gateway-f3-late-card.test.ts +0 -114
package/telegram-plugin/tests/real-gateway-harness.ts +0 -699
package/telegram-plugin/tests/real-gateway-i6-turn-flush-replay-dedup.test.ts +0 -313
package/telegram-plugin/tests/real-gateway-ipc-lifecycle.test.ts +0 -299
package/telegram-plugin/tests/real-gateway-spec.test.ts +0 -487
package/telegram-plugin/tests/real-gateway.smoke.test.ts +0 -101
package/telegram-plugin/tests/setup-flow.test.ts +0 -510
package/telegram-plugin/tests/setup-state.test.ts +0 -146
package/telegram-plugin/tests/sync-chat-running-subagents.test.ts +0 -116
package/telegram-plugin/tests/turn-end-regressions.test.ts +0 -489
package/telegram-plugin/tests/turn-flush-card-takeover.test.ts +0 -218
package/telegram-plugin/tests/turn-flush-prose-recovery.test.ts +0 -78
package/telegram-plugin/tests/two-zone-bg-carry-full-lifecycle.test.ts +0 -131
package/telegram-plugin/tests/two-zone-bg-detection.test.ts +0 -120
package/telegram-plugin/tests/two-zone-bg-done-when-all-terminal.test.ts +0 -116
package/telegram-plugin/tests/two-zone-bg-early-turn-end.test.ts +0 -87
package/telegram-plugin/tests/two-zone-bg-survives-next-turn.test.ts +0 -211
package/telegram-plugin/tests/two-zone-card-cap.test.ts +0 -62
package/telegram-plugin/tests/two-zone-card-fleet-row.test.ts +0 -101
package/telegram-plugin/tests/two-zone-card-header-phases.test.ts +0 -78
package/telegram-plugin/tests/two-zone-card-html-balance.test.ts +0 -110
package/telegram-plugin/tests/two-zone-card-lifecycle.test.ts +0 -128
package/telegram-plugin/tests/two-zone-card-sanitise.test.ts +0 -58
package/telegram-plugin/tests/two-zone-card-snapshot.test.ts +0 -133
package/telegram-plugin/tests/two-zone-concurrent-turns-isolation.test.ts +0 -155
package/telegram-plugin/tests/two-zone-phasefor-precedence.test.ts +0 -117
package/telegram-plugin/tests/two-zone-snapshot-extras.test.ts +0 -187
package/telegram-plugin/tests/two-zone-stuck-edit-throttle.test.ts +0 -149
package/telegram-plugin/tests/two-zone-stuck-header-escalation.test.ts +0 -101
package/telegram-plugin/tests/two-zone-stuck-per-member.test.ts +0 -114
package/telegram-plugin/tests/two-zone-stuck-recovery.test.ts +0 -105
package/telegram-plugin/tests/waiting-ux-harness.ts +0 -381
package/telegram-plugin/tests/waiting-ux.e2e.test.ts +0 -233
package/telegram-plugin/turn-flush-prose-recovery.ts +0 -40
package/telegram-plugin/two-zone-card.ts +0 -269
package/telegram-plugin/uat/scenarios/smoke-clerk-reply.test.ts +0 -61

package/telegram-plugin/tests/sandbox-hint-posttool.test.ts ADDED Viewed

@@ -0,0 +1,155 @@
+/**
+ * Tests for the sandbox-hint-posttool hook (Layer 2 of the sandbox UX work).
+ *
+ * Hook contract:
+ *   stdin:  PostToolUse JSON event { tool_name, tool_response, ... }
+ *   stdout: optional JSON
+ *             {"hookSpecificOutput":{"hookEventName":"PostToolUse",
+ *              "additionalContext":"..."}}
+ *   exit:   0 always.
+ *
+ * Tests spawn the hook as a subprocess (mirroring how Claude Code invokes
+ * it), feed a tool_response, and assert whether additionalContext was
+ * emitted and that it carries the load-bearing strings the agent needs.
+ */
+import { describe, it, expect } from 'bun:test'
+import { join } from 'path'
+import { spawnSync } from 'child_process'
+const HOOK_SCRIPT = join(import.meta.dir, '..', 'hooks', 'sandbox-hint-posttool.mjs')
+function runHook(event: object) {
+  const result = spawnSync(process.execPath, [HOOK_SCRIPT], {
+    input: JSON.stringify(event),
+    encoding: 'utf8',
+    env: process.env,
+    timeout: 5_000,
+  })
+  return result
+}
+function parseContext(stdout: string): string | null {
+  if (!stdout.trim()) return null
+  const parsed = JSON.parse(stdout)
+  return parsed?.hookSpecificOutput?.additionalContext ?? null
+}
+describe('sandbox-hint-posttool', () => {
+  it('emits sandbox hint when tool_response contains EROFS', () => {
+    const result = runHook({
+      tool_name: 'Write',
+      tool_use_id: 'toolu_001',
+      tool_response: {
+        error: "EROFS: read-only file system, open '/opt/switchroom/skills/foo.md'",
+      },
+    })
+    expect(result.status).toBe(0)
+    const ctx = parseContext(result.stdout)
+    expect(ctx).not.toBeNull()
+    expect(ctx).toContain('Sandbox boundary hit')
+    expect(ctx).toContain('operator action')
+    expect(ctx).toContain('Writable paths')
+  })
+  it('emits sandbox hint when tool_response contains "Read-only file system"', () => {
+    const result = runHook({
+      tool_name: 'Edit',
+      tool_use_id: 'toolu_002',
+      tool_response: 'mkdir: cannot create directory: Read-only file system',
+    })
+    expect(result.status).toBe(0)
+    const ctx = parseContext(result.stdout)
+    expect(ctx).toContain('Sandbox boundary hit')
+  })
+  it('emits an apt-specific hint when tool_response shows dpkg permission denied', () => {
+    const result = runHook({
+      tool_name: 'Bash',
+      tool_use_id: 'toolu_003',
+      tool_response: {
+        stderr:
+          'E: Unable to acquire the dpkg frontend lock (/var/lib/dpkg/lock-frontend), are you root?',
+      },
+    })
+    expect(result.status).toBe(0)
+    const ctx = parseContext(result.stdout)
+    expect(ctx).toContain('docker/Dockerfile.agent')
+    expect(ctx).toContain('rebuild')
+  })
+  it('emits a hint for EACCES on a rootfs path', () => {
+    const result = runHook({
+      tool_name: 'Bash',
+      tool_use_id: 'toolu_004',
+      tool_response: 'npm ERR! EACCES: permission denied, mkdir "/usr/lib/node_modules/foo"',
+    })
+    expect(result.status).toBe(0)
+    const ctx = parseContext(result.stdout)
+    expect(ctx).toContain('Sandbox boundary hit')
+  })
+  it('emits nothing when tool_response is a normal success', () => {
+    const result = runHook({
+      tool_name: 'Bash',
+      tool_use_id: 'toolu_005',
+      tool_response: { stdout: 'hello world\n', exit_code: 0 },
+    })
+    expect(result.status).toBe(0)
+    expect(result.stdout.trim()).toBe('')
+  })
+  it('emits nothing when tool_response merely mentions /usr but is not a sandbox error', () => {
+    // Guard against false positives — the agent may legitimately discuss
+    // paths under /usr in normal output (e.g. `which node` returning
+    // /usr/local/bin/node). Only EACCES / EROFS patterns should trigger.
+    const result = runHook({
+      tool_name: 'Bash',
+      tool_use_id: 'toolu_006',
+      tool_response: { stdout: '/usr/local/bin/node\n' },
+    })
+    expect(result.status).toBe(0)
+    expect(result.stdout.trim()).toBe('')
+  })
+  it('exits 0 on malformed stdin without crashing', () => {
+    const result = spawnSync(process.execPath, [HOOK_SCRIPT], {
+      input: 'not json at all',
+      encoding: 'utf8',
+      timeout: 5_000,
+    })
+    expect(result.status).toBe(0)
+    expect(result.stdout.trim()).toBe('')
+  })
+  it('exits 0 on empty stdin', () => {
+    const result = spawnSync(process.execPath, [HOOK_SCRIPT], {
+      input: '',
+      encoding: 'utf8',
+      timeout: 5_000,
+    })
+    expect(result.status).toBe(0)
+    expect(result.stdout.trim()).toBe('')
+  })
+  it('caps the scan window for huge tool_response payloads', () => {
+    // 100 KiB of harmless output followed by an EROFS — we cap at 64 KiB
+    // so this should NOT match. Keeps a runaway tool_response from
+    // pinning the hook on a regex scan.
+    const huge = 'x'.repeat(100 * 1024) + ' EROFS happened'
+    const result = runHook({
+      tool_name: 'Bash',
+      tool_use_id: 'toolu_007',
+      tool_response: { stdout: huge },
+    })
+    expect(result.status).toBe(0)
+    expect(result.stdout.trim()).toBe('')
+  })
+})

package/telegram-plugin/tests/secret-detect-delete-must-surface-failures.test.ts ADDED Viewed

@@ -0,0 +1,133 @@
+/**
+ * TDD-RED-first contract for the silent-delete-failure class the
+ * operator reported on 2026-05-12.
+ *
+ * Symptom: "🔒 captured a secret. we deleted it from chat" lands as
+ * a reply, but the raw secret-bearing message remains visible in
+ * chat history. The operator only finds out by scrolling, after
+ * the secret has already been screen-shot / cached / synced to
+ * other devices.
+ *
+ * Root cause: every secret-detect call site that invokes
+ * `bot.api.deleteMessage(chat_id, msgId)` does it via a raw
+ * `try { … } catch { … }` block that silently swallows the error
+ * (or, at best, logs to stderr — invisible to the operator). The
+ * gateway already has a `deleteSensitiveMessage(chat_id, msgId,
+ * reason)` helper that does the right thing — try delete, surface
+ * loudly on failure with an in-chat warning naming the message id
+ * the operator must delete manually. The four secret-detect sites
+ * weren't migrated when that helper was added (#44).
+ *
+ * The fix is mechanical: replace each `try { bot.api.deleteMessage
+ * } catch { }` in the secret-detect path with
+ * `deleteSensitiveMessage`. That's what this test pins.
+ *
+ * Failing means: at least one secret-detect path still has a raw
+ * `bot.api.deleteMessage` call wrapped in a swallow-catch — a
+ * regression of the silent-failure bug.
+ */
+import { describe, it, expect } from "vitest";
+import { readFileSync } from "node:fs";
+import { resolve } from "node:path";
+const gatewaySrc = readFileSync(
+  resolve(__dirname, "..", "gateway", "gateway.ts"),
+  "utf-8",
+);
+/** Slice the gateway source between two anchor strings. */
+function sliceBetween(src: string, from: string, to: string): string {
+  const start = src.indexOf(from);
+  if (start < 0) return "";
+  const end = src.indexOf(to, start);
+  return src.slice(start, end > 0 ? end : src.length);
+}
+describe("secret-detect — delete failures must NOT be silently swallowed (2026-05-12)", () => {
+  // The secret-detect block lives inside `handleInbound`. It runs
+  // through several branches:
+  //   - passphrase cached + high-confidence hit (stored path)
+  //   - passphrase cached + Channel-B auth-flow fallback
+  //   - no-passphrase deferred path
+  //   - pipeline-error fail-closed path
+  //
+  // Each branch deletes the raw message. None of them may use the
+  // raw `bot.api.deleteMessage` pattern wrapped in a swallow-catch
+  // — they must all route through `deleteSensitiveMessage` which
+  // surfaces failures via stderr + in-chat warning.
+  const secretDetectBlock = sliceBetween(
+    gatewaySrc,
+    "FAIL-CLOSED: if the pipeline throws",
+    "Status reaction controller",
+  );
+  it("the secret-detect block exists and is non-trivial (anchor sanity)", () => {
+    // fails when: the anchors above are renamed/moved. If this fails,
+    // update the anchors AND audit the other assertions in this file
+    // to make sure they still target the secret-detect path.
+    expect(secretDetectBlock.length).toBeGreaterThan(500);
+  });
+  it("no raw `bot.api.deleteMessage` calls inside the secret-detect block", () => {
+    // fails when: a code site reverts to the raw API call (which
+    // swallows on failure). All deletes here MUST route through the
+    // shared helper.
+    expect(secretDetectBlock).not.toMatch(/bot\.api\.deleteMessage/);
+  });
+  it("every delete in the secret-detect block goes through deleteSensitiveMessage", () => {
+    // The block currently performs deletes for four distinct cases
+    // (stored / auth-flow-fallback / deferred / pipeline-error). All
+    // four MUST land here.
+    //
+    // fails when: a refactor extracts one of the branches into a
+    // helper that doesn't use deleteSensitiveMessage, OR when a new
+    // branch is added without the helper. Either way the contract
+    // breaks.
+    const callMatches = secretDetectBlock.match(/deleteSensitiveMessage\s*\(/g) ?? [];
+    expect(
+      callMatches.length,
+      `expected ≥3 deleteSensitiveMessage calls inside the secret-detect block; got ${callMatches.length}`,
+    ).toBeGreaterThanOrEqual(3);
+  });
+  it("no swallow-catch pattern around delete calls in the secret-detect block", () => {
+    // The legacy pattern: `try { await bot.api.deleteMessage(...) } catch {}`
+    // OR `try { ... } catch { /* swallow */ }`. The helper handles
+    // failure surfacing, so call sites should NOT wrap the helper
+    // in another silencing catch.
+    //
+    // fails when: a refactor wraps the helper call in `try { ... } catch {}`
+    // for "robustness" — which would re-introduce the silent-failure
+    // class this PR exists to close.
+    expect(secretDetectBlock).not.toMatch(/try\s*\{[^}]*deleteSensitiveMessage[^}]*\}\s*catch\s*\{\s*\}/s);
+    // Also forbid the raw `try { bot.api.deleteMessage ... } catch {}` shape.
+    expect(secretDetectBlock).not.toMatch(/try\s*\{[^}]*bot\.api\.deleteMessage[^}]*\}\s*catch/s);
+  });
+});
+describe("secret-detect — deleteSensitiveMessage helper retains its 'surface failures' contract", () => {
+  // The fix only works if the helper itself surfaces failures.
+  // Pin the helper's load-bearing behavior so a future refactor
+  // can't quietly turn it into a silent-catch.
+  const helperBody = sliceBetween(
+    gatewaySrc,
+    "async function deleteSensitiveMessage",
+    "function getCommandArgs",
+  );
+  it("helper logs to stderr on delete failure", () => {
+    expect(helperBody).toMatch(/process\.stderr\.write/);
+    expect(helperBody).toMatch(/SECURITY:.*FAILED/);
+  });
+  it("helper posts an in-chat warning naming the leaked message id", () => {
+    // The warning is the only signal a mobile-only operator gets —
+    // stderr is invisible to them. Pinning the in-chat surface as
+    // the load-bearing piece.
+    expect(helperBody).toMatch(/sendMessage/);
+    expect(helperBody).toMatch(/delete message.*manually|delete it manually|manually|delete message <code>/i);
+  });
+});

package/telegram-plugin/tests/secret-detect-false-positives.test.ts ADDED Viewed

@@ -0,0 +1,137 @@
+/**
+ * TDD-RED-first contract tests for the false-positive class the
+ * operator reported on 2026-05-12.
+ *
+ * Symptom: casual chat that MENTIONS the words "secret", "token",
+ * "password", or an ALLCAPS *_KEY/_TOKEN/_SECRET identifier triggers
+ * the redaction pipeline as if the user just pasted a real credential
+ * — original message gets deleted, ambiguous-card lands, the operator
+ * has to dismiss it. Worst case: the operator is asking the agent
+ * *about* a secret ("delete the secret I sent yesterday") and gets
+ * stuck in a redaction-of-the-question loop.
+ *
+ * The pre-fix `env_key_value` pattern in patterns.ts:71 is the
+ * load-bearing culprit:
+ *
+ *   /\b([A-Z0-9_]*(?:KEY|TOKEN|SECRET|PASSWORD|PASSWD))\b\s*[=:]\s*
+ *     (["']?)([^\s"'\\]+)\2/g
+ *
+ * It matches ANY value after `SECRET=` / `TOKEN=` with no entropy
+ * gate, no length floor, no shape check on the value. Trivially fires
+ * on `SECRET=foo`, `MY_KEY=bar`, even `FATSECRET=hello`.
+ *
+ * The pre-fix `kv_entropy` pattern in kv-scanner.ts:30 has a 4.0
+ * entropy gate which catches some — but `kv_entropy` is the
+ * lower-confidence layer and doesn't run when the higher-confidence
+ * `env_key_value` already fired. Tightening env_key_value is the
+ * right place to land the fix.
+ *
+ * Each test is the contract: detection MUST NOT fire on the listed
+ * input. Failing means the pipeline still flags the input as a hit.
+ * The fix adds an entropy + length floor to env_key_value to match
+ * the existing kv_entropy precedent.
+ */
+import { describe, it, expect } from "vitest";
+import { detectSecrets } from "../secret-detect/index.js";
+describe("secret-detect — does NOT fire on casual mentions of 'secret' / 'token' / 'password'", () => {
+  // The "operator asking the agent about a secret" cases.
+  // Pre-fix: env_key_value matches "SECRET=" anywhere; these were
+  // tripping. Post-fix: entropy + length gate on the value.
+  it.each([
+    [
+      "operator asks for a secret by name",
+      "what's my fatsecret token?",
+    ],
+    [
+      "operator references a deleted prior message",
+      "please delete that secret you sent earlier",
+    ],
+    [
+      "agent name contains 'secret' as a substring (FatSecret API)",
+      "the FatSecret API needs an OAuth token — can you wire it up?",
+    ],
+    [
+      "human language sentence with 'password' as a noun",
+      "I keep forgetting my password again",
+    ],
+    [
+      "fragment that mentions an env var by name but no value",
+      "the FATSECRET_TOKEN env var is missing",
+    ],
+    [
+      "code-shaped placeholder, value is human-readable English",
+      "set FOO_SECRET=hello and try again",
+    ],
+    [
+      "shell example with placeholder value (test fixture style)",
+      "run: export OPENAI_API_KEY=sk-yourkey",
+    ],
+  ])("%s — %j", (_label, text) => {
+    const hits = detectSecrets(text);
+    expect(
+      hits,
+      `false positive on ${JSON.stringify(text)} — hits=${JSON.stringify(hits.map((h) => h.matched_text))}`,
+    ).toEqual([]);
+  });
+});
+describe("secret-detect — DOES still fire on actually-shaped secrets (regression guard)", () => {
+  // After tightening env_key_value, these MUST still be caught.
+  // Locking in so a future regex-tightening doesn't over-shoot.
+  // Values constructed at runtime so the source file doesn't trip
+  // GitHub Push Protection — same pattern as
+  // secret-detect-secretlint.test.ts:1.
+  const fakeApiKey = `sk-ant-${"a1b2c3d4".repeat(4)}XYZ987`; // sk-ant- + 32 chars
+  const fakeBearer = `${"abc123".repeat(8)}.${"def456".repeat(4)}`;
+  const fakeRandom = `${"x9zM4kP3qR7sT2vW".repeat(2)}`; // 32 chars, high entropy
+  it.each([
+    [
+      "real-shaped Anthropic API key (anchored prefix path)",
+      `export ANTHROPIC_API_KEY=${fakeApiKey}`,
+    ],
+    [
+      "real-shaped Bearer token (anchored Bearer path)",
+      `Authorization: Bearer ${fakeBearer}`,
+    ],
+    [
+      "uppercase env_key_value with high-entropy value (must still match)",
+      `MYAPP_API_KEY=${fakeRandom}`,
+    ],
+  ])("%s — %j", (_label, text) => {
+    const hits = detectSecrets(text);
+    expect(
+      hits.length,
+      `regression: expected a hit on ${JSON.stringify(text)} but pipeline returned 0`,
+    ).toBeGreaterThanOrEqual(1);
+  });
+});
+describe("secret-detect — boundary cases that pin the fix's shape", () => {
+  it("short low-entropy value after KEY= is NOT flagged", () => {
+    // pre-fix: matches; post-fix: filtered by entropy/length gate.
+    expect(detectSecrets("MY_API_KEY=foo")).toEqual([]);
+  });
+  it("English word after KEY= is NOT flagged", () => {
+    expect(detectSecrets("MY_TOKEN=hello")).toEqual([]);
+  });
+  it("long but low-entropy value after KEY= is NOT flagged (repeating chars)", () => {
+    // 32 chars but all 'a' — Shannon entropy ~0. Real secrets are
+    // dense; this is template/placeholder shape.
+    expect(detectSecrets(`MY_KEY=${"a".repeat(32)}`)).toEqual([]);
+  });
+  it("high-entropy value after KEY= IS flagged (the fix doesn't break detection)", () => {
+    // 32 chars of base64-ish noise. Should match.
+    const hits = detectSecrets(
+      // Build the value via concat to avoid Push-Protection trip on a
+      // contiguous secret-shaped literal.
+      `MY_API_KEY=${"k" + "9zMpQrT2vBxYuFnGwL8cHj"}`,
+    );
+    expect(hits.length).toBeGreaterThanOrEqual(1);
+  });
+});