npm - switchroom - Versions diffs - 0.15.44 → 0.16.4 - Mend

switchroom 0.15.44 → 0.16.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (150) hide show

package/dist/agent-scheduler/index.js +122 -88
package/dist/auth-broker/index.js +463 -177
package/dist/cli/autoaccept-poll.js +4842 -35
package/dist/cli/drive-write-pretool.mjs +17 -14
package/dist/cli/notion-write-pretool.mjs +117 -86
package/dist/cli/self-improve-apply-guard-pretool.mjs +626 -0
package/dist/cli/self-improve-stop.mjs +428 -0
package/dist/cli/skill-validate-pretool.mjs +72 -72
package/dist/cli/switchroom.js +3249 -1241
package/dist/cli/ui/index.html +1 -1
package/dist/host-control/main.js +2833 -355
package/dist/vault/approvals/kernel-server.js +7482 -7439
package/dist/vault/broker/server.js +11315 -11272
package/examples/minimal.yaml +1 -0
package/examples/switchroom.yaml +1 -0
package/package.json +3 -3
package/profiles/_base/start.sh.hbs +88 -1
package/profiles/_shared/execution-discipline.md.hbs +18 -0
package/profiles/default/CLAUDE.md.hbs +3 -22
package/telegram-plugin/.claude-plugin/plugin.json +2 -2
package/telegram-plugin/answer-stream-flag.ts +12 -49
package/telegram-plugin/answer-stream.ts +5 -150
package/telegram-plugin/auth-snapshot-format.ts +280 -48
package/telegram-plugin/auto-fallback-fleet.ts +44 -1
package/telegram-plugin/context-exhaustion.ts +12 -0
package/telegram-plugin/demo-mask.ts +154 -0
package/telegram-plugin/dist/bridge/bridge.js +167 -124
package/telegram-plugin/dist/gateway/gateway.js +3039 -1159
package/telegram-plugin/dist/server.js +215 -172
package/telegram-plugin/docs/waiting-ux-spec.md +2 -2
package/telegram-plugin/draft-stream.ts +47 -410
package/telegram-plugin/final-answer-detect.ts +17 -12
package/telegram-plugin/fleet-fallback-resume.ts +131 -0
package/telegram-plugin/format.ts +56 -19
package/telegram-plugin/gateway/auth-add-flow.ts +332 -127
package/telegram-plugin/gateway/auth-broker-client.ts +2 -2
package/telegram-plugin/gateway/auth-command.ts +70 -14
package/telegram-plugin/gateway/clean-shutdown-marker.ts +44 -0
package/telegram-plugin/gateway/config-approval-handler.test.ts +91 -4
package/telegram-plugin/gateway/config-approval-handler.ts +94 -13
package/telegram-plugin/gateway/current-turn-map.ts +188 -0
package/telegram-plugin/gateway/disconnect-flush.ts +3 -1
package/telegram-plugin/gateway/effort-command.ts +8 -3
package/telegram-plugin/gateway/emission-authority.ts +369 -0
package/telegram-plugin/gateway/feed-open-gate.ts +292 -0
package/telegram-plugin/gateway/gateway.ts +1837 -291
package/telegram-plugin/gateway/inject-handler.test.ts +2 -1
package/telegram-plugin/gateway/ms365-write-approval.test.ts +4 -4
package/telegram-plugin/gateway/represent-guard.ts +72 -0
package/telegram-plugin/gateway/status-surface-log.test.ts +5 -4
package/telegram-plugin/gateway/status-surface-log.ts +14 -3
package/telegram-plugin/history.ts +33 -11
package/telegram-plugin/hooks/repo-context-pretool.mjs +26 -0
package/telegram-plugin/hooks/subagent-tracker-posttool.mjs +5 -0
package/telegram-plugin/hooks/subagent-tracker-pretool.mjs +8 -0
package/telegram-plugin/hooks/tool-label-pretool.mjs +39 -15
package/telegram-plugin/issues-card.ts +4 -0
package/telegram-plugin/model-unavailable.ts +124 -0
package/telegram-plugin/narrative-dedup.ts +69 -0
package/telegram-plugin/over-ping-safety-net.ts +70 -4
package/telegram-plugin/package.json +3 -3
package/telegram-plugin/pending-work-progress.ts +12 -0
package/telegram-plugin/permission-rule.ts +32 -5
package/telegram-plugin/permission-title.ts +152 -9
package/telegram-plugin/quota-check.ts +13 -0
package/telegram-plugin/quota-watch.ts +135 -7
package/telegram-plugin/registry/turns-schema.test.ts +24 -0
package/telegram-plugin/registry/turns-schema.ts +9 -0
package/telegram-plugin/runtime-metrics.ts +13 -0
package/telegram-plugin/session-tail.ts +96 -11
package/telegram-plugin/silence-poke.ts +170 -24
package/telegram-plugin/slot-banner-driver.ts +3 -0
package/telegram-plugin/status-no-truncate.ts +44 -0
package/telegram-plugin/status-reactions.ts +20 -3
package/telegram-plugin/stream-controller.ts +4 -23
package/telegram-plugin/stream-reply-handler.ts +6 -24
package/telegram-plugin/streaming-metrics.ts +91 -0
package/telegram-plugin/subagent-watcher.ts +212 -66
package/telegram-plugin/tests/activity-ever-opened-sticky.test.ts +47 -0
package/telegram-plugin/tests/answer-stream-dedup.test.ts +9 -26
package/telegram-plugin/tests/answer-stream-flag.test.ts +25 -58
package/telegram-plugin/tests/answer-stream-silent-markers.test.ts +41 -51
package/telegram-plugin/tests/answer-stream.test.ts +2 -411
package/telegram-plugin/tests/auth-add-flow.test.ts +488 -253
package/telegram-plugin/tests/auth-command-format2.test.ts +71 -1
package/telegram-plugin/tests/auth-snapshot-format.test.ts +376 -6
package/telegram-plugin/tests/auto-fallback-fleet.test.ts +120 -0
package/telegram-plugin/tests/cross-turn-card-gate.test.ts +424 -0
package/telegram-plugin/tests/demo-mask.test.ts +127 -0
package/telegram-plugin/tests/draft-stream.test.ts +0 -827
package/telegram-plugin/tests/emission-authority-card-drain-gate.test.ts +236 -0
package/telegram-plugin/tests/emission-authority-facade.test.ts +488 -0
package/telegram-plugin/tests/emission-authority-open-gate.test.ts +179 -0
package/telegram-plugin/tests/emission-authority-ping-gate.test.ts +395 -0
package/telegram-plugin/tests/emission-determinism-wiring.test.ts +177 -0
package/telegram-plugin/tests/feed-heartbeat-liveness-open.test.ts +146 -0
package/telegram-plugin/tests/feed-open-gate.test.ts +259 -0
package/telegram-plugin/tests/feed-survival.test.ts +526 -0
package/telegram-plugin/tests/fleet-fallback-resume.test.ts +197 -0
package/telegram-plugin/tests/gateway-clean-shutdown-marker.test.ts +117 -0
package/telegram-plugin/tests/gateway-no-reply-single-emit.test.ts +4 -11
package/telegram-plugin/tests/history.test.ts +60 -0
package/telegram-plugin/tests/model-unavailable.test.ts +118 -0
package/telegram-plugin/tests/narrative-dedup.test.ts +118 -0
package/telegram-plugin/tests/orphaned-reply-rearm.test.ts +285 -0
package/telegram-plugin/tests/over-ping-final-answer-decoupling.test.ts +194 -0
package/telegram-plugin/tests/over-ping-safety-net.test.ts +2 -2
package/telegram-plugin/tests/per-topic-current-turn.test.ts +373 -0
package/telegram-plugin/tests/permission-card-origin-kill-switch.test.ts +42 -0
package/telegram-plugin/tests/permission-rule.test.ts +17 -0
package/telegram-plugin/tests/permission-title.test.ts +206 -17
package/telegram-plugin/tests/quota-watch.test.ts +252 -9
package/telegram-plugin/tests/reply-terminal-reaction.test.ts +6 -1
package/telegram-plugin/tests/repo-context-pretool.test.ts +62 -0
package/telegram-plugin/tests/represent-guard.test.ts +162 -0
package/telegram-plugin/tests/session-tail.test.ts +147 -3
package/telegram-plugin/tests/silence-liveness-wiring.test.ts +18 -0
package/telegram-plugin/tests/status-card-budget-parity.test.ts +72 -0
package/telegram-plugin/tests/status-surface-log.test.ts +146 -0
package/telegram-plugin/tests/subagent-watcher-clip-narrative.test.ts +58 -0
package/telegram-plugin/tests/subagent-watcher-parent-turn-key.test.ts +102 -0
package/telegram-plugin/tests/subagent-watcher-workflow-visibility.test.ts +225 -0
package/telegram-plugin/tests/subagent-watcher.test.ts +147 -0
package/telegram-plugin/tests/telegram-activity-visibility-integration.test.ts +597 -0
package/telegram-plugin/tests/telegram-format.test.ts +101 -6
package/telegram-plugin/tests/tool-activity-summary.test.ts +550 -15
package/telegram-plugin/tests/tool-label-pretool.test.ts +73 -0
package/telegram-plugin/tests/tool-label-sidecar.test.ts +44 -0
package/telegram-plugin/tests/tool-labels.test.ts +67 -0
package/telegram-plugin/tests/turn-liveness-floor.test.ts +196 -0
package/telegram-plugin/tests/turn-liveness-invariant.test.ts +340 -0
package/telegram-plugin/tests/welcome-text.test.ts +32 -3
package/telegram-plugin/tests/worker-activity-feed.test.ts +470 -22
package/telegram-plugin/tool-activity-summary.ts +375 -58
package/telegram-plugin/turn-liveness-floor.ts +240 -0
package/telegram-plugin/uat/assertions.ts +115 -0
package/telegram-plugin/uat/driver.ts +68 -0
package/telegram-plugin/uat/scenarios/bg-sub-agent-dispatch-dm.test.ts +119 -133
package/telegram-plugin/uat/scenarios/jtbd-answer-pings.test.ts +94 -0
package/telegram-plugin/uat/scenarios/jtbd-cross-turn-card-dm.test.ts +109 -0
package/telegram-plugin/uat/scenarios/jtbd-foreground-feed-thinkgap-dm.test.ts +478 -0
package/telegram-plugin/uat/scenarios/jtbd-foreground-feed-visibility-dm.test.ts +396 -0
package/telegram-plugin/uat/scenarios/jtbd-liveness-feed-open-dm.test.ts +202 -0
package/telegram-plugin/uat/scenarios/jtbd-reply-is-last-dm.test.ts +202 -0
package/telegram-plugin/uat/scenarios/reactions-dm.test.ts +93 -87
package/telegram-plugin/welcome-text.ts +13 -1
package/telegram-plugin/worker-activity-feed.ts +157 -82
package/telegram-plugin/draft-transport.ts +0 -122
package/telegram-plugin/tests/draft-retirement-wiring.test.ts +0 -82
package/telegram-plugin/tests/draft-transport.test.ts +0 -211

package/telegram-plugin/tests/worker-activity-feed.test.ts CHANGED Viewed

@@ -6,6 +6,7 @@ import {
   type WorkerActivityView,
   type BotApiForWorkerFeed,
 } from '../worker-activity-feed.js'
+import { STATUS_ROLLING_LINES, STATUS_LINE_MAX } from '../status-no-truncate.js'
 describe('isWorkerActivityFeedEnabled (default ON)', () => {
   it('defaults to true when the env var is unset', () => {
@@ -75,7 +76,8 @@ describe('renderWorkerActivity', () => {
   it('renders the native header + running status + step feed', () => {
     const out = renderWorkerActivity(view())
     expect(out).toContain('🛠 <b>Worker</b> · <i>research competitors</i>')
-    expect(out).toContain('running · ')
+    // Unified header: running shows "<elapsed> · N tools" (no "running ·" word).
+    expect(out).toContain('<i>10s · 3 tools</i>')
     expect(out).toContain('3 tools')
     // No narrativeLines → the latestSummary surfaces as the newest `→` step.
     expect(out).toContain('<b>→ scanning vendor pages</b>')
@@ -108,20 +110,41 @@ describe('renderWorkerActivity', () => {
       view({ state: 'done', toolCount: 5, latestSummary: 'PR #21 opened' }),
     )
     expect(out).toContain('🛠 <b>Worker</b> · <i>research competitors</i>')
-    expect(out).toContain('finished · completed · 5 tools · ')
+    // Unified done header: "done · N tools · <elapsed>".
+    expect(out).toContain('<i>done · 5 tools · ')
     expect(out).toContain('─────')
     expect(out).toContain('✅ <i>PR #21 opened</i>')
+    // latestSummary is the RESULT on the finished path, never also a step.
+    expect(out).not.toContain('<i>✓ PR #21 opened</i>')
   })
   it('renders a failed terminal recap', () => {
     const out = renderWorkerActivity(view({ state: 'failed', latestSummary: 'blew up' }))
-    expect(out).toContain('finished · failed · ')
+    // The header word reflects the failure (`failed · …`) AND the ⚠️ result
+    // block carries the detail — the two signals are complementary.
+    expect(out).toContain('<i>failed · ')
+    expect(out).not.toContain('<i>done · ')
     expect(out).toContain('⚠️ <i>blew up</i>')
   })
+  it('a failed worker with EMPTY result is never byte-identical to a done worker (regression: #2553 failure-honesty)', () => {
+    // Detail-less terminal error: resultText === '' (subagent-watcher path).
+    const failed = renderWorkerActivity(view({ state: 'failed', latestSummary: '' }))
+    const done = renderWorkerActivity(view({ state: 'done', latestSummary: '' }))
+    // (a) The two renders must differ — the failure signal cannot vanish.
+    expect(failed).not.toBe(done)
+    // (b) The failed render carries a visible failure marker even with no
+    //     result block (the `failed` header word and/or the ⚠️ emoji).
+    expect(failed.includes('failed') || failed.includes('⚠️')).toBe(true)
+    expect(failed).toContain('<i>failed · ')
+    // The done render must NOT read as failed.
+    expect(done).toContain('<i>done · ')
+    expect(done).not.toContain('failed')
+  })
   it('omits the rule + result line when the terminal result is empty', () => {
     const out = renderWorkerActivity(view({ state: 'done', latestSummary: '   ' }))
-    expect(out).toContain('finished · completed · ')
+    expect(out).toContain('<i>done · ')
     expect(out).not.toContain('─────')
   })
@@ -153,15 +176,17 @@ describe('renderWorkerActivity', () => {
     expect(stepCount(out)).toBe(2)
   })
-  it('shows an overflow header when the feed exceeds the cap', () => {
-    const lines = Array.from({ length: 9 }, (_, i) => `step ${i + 1}`)
+  it('shows a "+N earlier…" header when the feed exceeds STATUS_ROLLING_LINES (worker surface)', () => {
+    const total = STATUS_ROLLING_LINES + 3
+    const lines = Array.from({ length: total }, (_, i) => `step ${i + 1}`)
     const out = renderWorkerActivity(view({ narrativeLines: lines }))
-    expect(out).toContain('<i>✓ +3 earlier…</i>')
-    expect(out).not.toContain('step 1')
-    expect(out).toContain('<i>✓ step 4</i>')
-    expect(out).toContain('<b>→ step 9</b>')
-    // 6 visible step lines (the overflow header is not itself a step).
-    expect(out.match(/step \d/g) ?? []).toHaveLength(6)
+    expect(out).toContain(`<i>✓ +${total - STATUS_ROLLING_LINES} earlier…</i>`)
+    expect(out).not.toContain('step 1<')
+    const firstVisible = total - STATUS_ROLLING_LINES + 1
+    expect(out).toContain(`<i>✓ step ${firstVisible}</i>`)
+    expect(out).toContain(`<b>→ step ${total}</b>`)
+    // STATUS_ROLLING_LINES visible step lines (the overflow header isn't a step).
+    expect(out.match(/step \d/g) ?? []).toHaveLength(STATUS_ROLLING_LINES)
   })
   it('strips Markdown markup from narrative + description + result', () => {
@@ -278,7 +303,7 @@ describe('createWorkerActivityFeed', () => {
     clock = 10_500 // well within the throttle window
     await feed.finish('w1', view({ state: 'done', toolCount: 5 }))
     expect(bot.edits).toHaveLength(1)
-    expect(bot.edits[0].text).toContain('finished · completed · 5 tools')
+    expect(bot.edits[0].text).toContain('<i>done · 5 tools · ')
     // finish forgets the worker.
     expect(feed.has('w1')).toBe(false)
     expect(feed.size).toBe(0)
@@ -391,23 +416,22 @@ describe('createWorkerActivityFeed', () => {
     expect(last.text.match(/[✓→]/g) ?? []).toHaveLength(1)
   })
-  it('caps the narrative block to the last 6 lines', async () => {
+  it('rolls the narrative block to the last STATUS_ROLLING_LINES lines', async () => {
     const bot = makeFakeBot()
     let clock = 10_000
     const feed = createWorkerActivityFeed({ bot, now: () => clock, minEditIntervalMs: 0 })
-    for (let i = 1; i <= 9; i++) {
+    const total = 9
+    for (let i = 1; i <= total; i++) {
       clock += 1000
-      await feed.update('w1', 'chat', view({ toolCount: i, latestSummary: `line ${i}` }))
+      await feed.update('w1', 'chat', view({ toolCount: i, latestSummary: `ln-${String(i).padStart(3, '0')}` }))
     }
     const last = bot.edits.at(-1)!
-    expect(last.text.match(/[✓→]/g) ?? []).toHaveLength(6)
-    // Oldest lines evicted; newest retained.
-    expect(last.text).not.toContain('line 1')
-    expect(last.text).not.toContain('line 3')
-    expect(last.text).toContain('line 4')
-    expect(last.text).toContain('line 9')
+    expect(last.text.match(/[✓→]/g) ?? []).toHaveLength(STATUS_ROLLING_LINES)
+    const firstVisible = total - STATUS_ROLLING_LINES + 1
+    for (let i = 1; i < firstVisible; i++) expect(last.text).not.toContain(`ln-${String(i).padStart(3, '0')}`)
+    for (let i = firstVisible; i <= total; i++) expect(last.text).toContain(`ln-${String(i).padStart(3, '0')}`)
   })
   it('grows the narrative even while throttled (line surfaces on next edit)', async () => {
@@ -501,3 +525,427 @@ describe('createWorkerActivityFeed — log sink', () => {
     expect(logs.some((l) => l.startsWith('worker-feed: paint'))).toBe(false)
   })
 })
+// ─── Rolling window + STATUS_LINE_MAX (flag retired) ─────────────────────────
+// Single mode: last STATUS_ROLLING_LINES lines render in full (clipped per-line
+// at STATUS_LINE_MAX=200), overflow → `+N earlier…` header on the worker surface,
+// char-budget backstop is the only wire-limit ceiling.
+describe('rolling window + STATUS_LINE_MAX — renderWorkerActivity', () => {
+  // Fixed-width step label ("stp-007"), so no label is a substring of another.
+  const stepLabel = (n: number): string => `stp-${String(n).padStart(3, '0')}`
+  it('with 12 narrative lines, exactly the last STATUS_ROLLING_LINES render + a +N earlier header', () => {
+    const TOTAL = 12
+    const narrativeLines: string[] = []
+    for (let n = 1; n <= TOTAL; n += 1) narrativeLines.push(stepLabel(n))
+    const out = renderWorkerActivity(view({ narrativeLines }))
+    const hiddenCount = TOTAL - STATUS_ROLLING_LINES
+    const firstVisible = hiddenCount + 1
+    // The tail of the feed is rendered…
+    for (let n = firstVisible; n <= TOTAL; n += 1) expect(out).toContain(stepLabel(n))
+    // …and everything before it has rolled off.
+    for (let n = 1; n < firstVisible; n += 1) expect(out).not.toContain(stepLabel(n))
+    // The rolled-off count is reported by the overflow header on this surface.
+    expect(out).toContain(`<i>✓ +${hiddenCount} earlier…</i>`)
+    expect(out).toContain('<b>→ stp-012</b>')
+  })
+  it('STATUS_LINE_MAX=200: a 250-char line is clipped to 200 with a trailing …', () => {
+    const oversized = 'a'.repeat(250)
+    // Expected clip: STATUS_LINE_MAX - 1 content chars followed by the ellipsis.
+    const clipped = 'a'.repeat(STATUS_LINE_MAX - 1) + '…'
+    const out = renderWorkerActivity(view({ narrativeLines: [oversized] }))
+    expect(out).toContain('…')
+    expect(out).not.toContain(oversized)
+    expect(out).toContain(clipped)
+  })
+  it('a line at exactly STATUS_LINE_MAX is NOT clipped', () => {
+    // Boundary case: a line of exactly STATUS_LINE_MAX chars passes through whole.
+    const atLimit = 'b'.repeat(STATUS_LINE_MAX)
+    const out = renderWorkerActivity(view({ narrativeLines: [atLimit] }))
+    expect(out).toContain(atLimit)
+    expect(out).not.toContain('…')
+  })
+  it('no "+N earlier…" overflow header when the feed fits the window', () => {
+    const narrativeLines: string[] = []
+    for (let n = 1; n <= STATUS_ROLLING_LINES; n += 1) narrativeLines.push(`step ${n}`)
+    const out = renderWorkerActivity(view({ narrativeLines }))
+    expect(out).not.toContain('earlier…')
+  })
+  it('pathologically oversized body: char-budget backstop fires, output ≤ 4096 chars', () => {
+    // A full window of 900-char lines.
+    const narrativeLines = new Array<string>(STATUS_ROLLING_LINES).fill('z'.repeat(900))
+    const out = renderWorkerActivity(view({ narrativeLines }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    // At least one step bullet (→ or ✓) must survive the trimming.
+    const hasBullet = /[→✓]/.test(out)
+    expect(hasBullet).toBe(true)
+  })
+})
+describe('rolling window — createWorkerActivityFeed narrative accumulation', () => {
+  it('with 12 pushes, only the last STATUS_ROLLING_LINES appear in the render', async () => {
+    const PUSHES = 12
+    // Fixed-width label ("ln-004"), so one label is never a substring of another.
+    const lineLabel = (n: number): string => `ln-${String(n).padStart(3, '0')}`
+    const bot = makeFakeBot()
+    let nowMs = 10_000
+    const feed = createWorkerActivityFeed({ bot, now: () => nowMs, minEditIntervalMs: 0 })
+    // One update per second of fake time, each carrying a new latestSummary.
+    for (let n = 1; n <= PUSHES; n += 1) {
+      nowMs += 1000
+      await feed.update('w1', 'chat', view({ toolCount: n, latestSummary: lineLabel(n) }))
+    }
+    const last = bot.edits.at(-1)!
+    const firstVisible = PUSHES - STATUS_ROLLING_LINES + 1
+    for (let n = firstVisible; n <= PUSHES; n += 1) expect(last.text).toContain(lineLabel(n))
+    for (let n = 1; n < firstVisible; n += 1) expect(last.text).not.toContain(lineLabel(n))
+    // No overflow marker is expected on the manager path: this test relies on the
+    // manager keeping at most STATUS_ROLLING_LINES narrative lines, so the renderer
+    // is never handed more lines than the window. The "+N earlier…" marker is
+    // only expected when renderWorkerActivity is called directly with more lines
+    // than the window.
+    expect(last.text).not.toContain('earlier…')
+    expect(last.text).toContain('<b>→ ln-012</b>')
+  })
+})
+// ─── Worker heartbeat (option a — suffix-only, never opens a new message) ─────
+describe('createWorkerActivityFeed — heartbeat', () => {
+  // Exercises feed.heartbeatTick() directly. Every case stubs setInterval /
+  // clearInterval and reads time from a manually advanced `clock` via `now`,
+  // so no real timer runs and each tick happens at a chosen instant.
+  it('(i) a tick fires a re-render with a climbing · Ns suffix on a stale worker', async () => {
+    const bot = makeFakeBot()
+    let clock = 10_000
+    const feed = createWorkerActivityFeed({
+      bot,
+      now: () => clock,
+      minEditIntervalMs: 2500,
+      heartbeatTickMs: 6000,
+      // No real timer: drive ticks manually.
+      setInterval: () => 1,
+      clearInterval: () => {},
+    })
+    // First paint: the view reports elapsedMs 9000, chosen to clear the first-paint minimum (the original note gives its default as 8000 — defined outside this file).
+    clock = 19_000
+    await feed.update('w1', 'chat', view({ elapsedMs: 9000, latestSummary: 'pulling data' }))
+    expect(bot.sent).toHaveLength(1)
+    // Implied dispatch instant: 19_000 - 9000 = 10_000.
+    const dispatchAt = clock - 9000
+    // Advance past the staleness window so the heartbeat ticks.
+    clock = 26_000 // lastEditAt(19000) + 7000 ≥ heartbeatTickMs(6000) and ≥ minEditInterval
+    feed.heartbeatTick()
+    // Rejections from this follow-up update are deliberately ignored; it is only here to let queued work run.
+    await feed.update('w1', 'chat', view({ elapsedMs: 16_000, latestSummary: 'pulling data' })).catch(() => {})
+    // Drain the chain.
+    await feed.update('w1', 'chat', view({ elapsedMs: 16_000, latestSummary: 'pulling data' }))
+    // Look for an edit whose text ends a bold run with "· <digits>s".
+    const edit1 = bot.edits.find((e) => /· \d+s<\/b>/.test(e.text))
+    expect(edit1).toBeDefined()
+    // The suffix reflects the LIVE elapsed (now - dispatchAt), not the stale view.
+    // NOTE(review): the follow-up views above carry elapsedMs 16_000, which equals
+    // 26_000 - dispatchAt, so both sources yield "16s" and this assertion alone
+    // cannot tell them apart — confirm whether a differing view value was intended.
+    expect(edit1!.text).toContain(`· ${Math.floor((26_000 - dispatchAt) / 1000)}s`)
+  })
+  it('(ii) respects a 429 cooldown — no edit while cooldownUntil is in the future', async () => {
+    const bot = makeFakeBot()
+    let clock = 10_000
+    const feed = createWorkerActivityFeed({
+      bot,
+      now: () => clock,
+      minEditIntervalMs: 0,
+      heartbeatTickMs: 6000,
+      firstPaintMinMs: 0,
+      setInterval: () => 1,
+      clearInterval: () => {},
+    })
+    await feed.update('w1', 'chat', view({ elapsedMs: 1000, latestSummary: 'go' }))
+    expect(bot.sent).toHaveLength(1)
+    // Induce a cooldown by failing the next edit with a 429 (retry_after: 30 — presumably seconds; confirm against the feed implementation).
+    clock = 20_000
+    bot.failNextEditWith = { error_code: 429, parameters: { retry_after: 30 } }
+    await feed.update('w1', 'chat', view({ elapsedMs: 11_000, latestSummary: 'changed' }))
+    // Baseline edit count, taken after the failed attempt.
+    const editsAfterCooldown = bot.edits.length
+    // Tick while still inside the cooldown window → no new edit.
+    clock = 27_000
+    feed.heartbeatTick()
+    await feed.update('w1', 'chat', view({ elapsedMs: 18_000, latestSummary: 'changed' }))
+    expect(bot.edits.length).toBe(editsAfterCooldown)
+  })
+  it('(iii) does not edit after the handle is removed on finish', async () => {
+    const bot = makeFakeBot()
+    let clock = 10_000
+    const feed = createWorkerActivityFeed({
+      bot,
+      now: () => clock,
+      minEditIntervalMs: 0,
+      heartbeatTickMs: 6000,
+      setInterval: () => 1,
+      clearInterval: () => {},
+    })
+    await feed.update('w1', 'chat', view({ latestSummary: 'go' }))
+    clock = 20_000
+    // finish() is expected to drop the worker's handle (asserted via has()).
+    await feed.finish('w1', view({ state: 'done', toolCount: 2 }))
+    expect(feed.has('w1')).toBe(false)
+    const editsBefore = bot.edits.length
+    clock = 30_000
+    feed.heartbeatTick()
+    // No handle → tick is a no-op, no further edit.
+    expect(bot.edits.length).toBe(editsBefore)
+  })
+  it('(iv) stop() clears the interval and a tick on empty handles is a no-op (no leak)', () => {
+    // Flipped by the clearInterval stub so the test can observe that stop() called it.
+    let cleared = false
+    const bot = makeFakeBot()
+    let clock = 10_000
+    const feed = createWorkerActivityFeed({
+      bot,
+      now: () => clock,
+      setInterval: () => 1,
+      clearInterval: () => { cleared = true },
+    })
+    // No handles yet → tick does nothing and does not throw.
+    expect(() => feed.heartbeatTick()).not.toThrow()
+    feed.stop()
+    expect(cleared).toBe(true)
+  })
+  it('(v) respects minEditInterval — a tick inside the throttle window does not edit', async () => {
+    const bot = makeFakeBot()
+    let clock = 10_000
+    const feed = createWorkerActivityFeed({
+      bot,
+      now: () => clock,
+      minEditIntervalMs: 2500,
+      heartbeatTickMs: 6000,
+      firstPaintMinMs: 0,
+      setInterval: () => 1,
+      clearInterval: () => {},
+    })
+    await feed.update('w1', 'chat', view({ elapsedMs: 1000, latestSummary: 'go' }))
+    expect(bot.sent).toHaveLength(1)
+    const editsBefore = bot.edits.length
+    // Tick only 1000ms after the paint — inside minEditInterval (2500) → no edit.
+    clock = 11_000
+    feed.heartbeatTick()
+    // Same summary as the first paint; any rejection is ignored on purpose.
+    await feed.update('w1', 'chat', view({ elapsedMs: 2000, latestSummary: 'go' })).catch(() => {})
+    expect(bot.edits.length).toBe(editsBefore)
+  })
+})
+// ─── Extreme-edge: single oversized narrative line (no-truncate ON) ──────────
+// Reproduces the bug where accumulateNarrative's char-budget splice would push
+// the oversized line then immediately splice it out, making the narrative empty
+// and the step vanish from the rendered output.
+/**
+ * Lightweight well-formedness probe for worker-card HTML.
+ *
+ * Passes only when (1) `<b>`/`</b>` and `<i>`/`</i>` each occur in equal
+ * numbers and (2) every `&` that is followed by lowercase letters has a `;`
+ * directly after that letter run. Condition (2) catches entities cut mid-way
+ * (`&am`, `&l`, `&amp` with no `;`), as produced by slicing already-escaped
+ * text. An `&` with no lowercase letter right after it is not inspected.
+ *
+ * @param s rendered card text to inspect
+ * @returns true when both conditions hold, false otherwise
+ */
+function isValidWorkerHtml(s: string): boolean {
+  // Number of non-overlapping occurrences of a literal token in `s`.
+  const occurrences = (token: string): number => s.split(token).length - 1
+  if (occurrences('<b>') !== occurrences('</b>')) return false
+  if (occurrences('<i>') !== occurrences('</i>')) return false
+  // Hop from one `&` to the next; a hand-rolled scan keeps the entity check
+  // free of regex backtracking surprises.
+  for (let amp = s.indexOf('&'); amp !== -1; amp = s.indexOf('&', amp + 1)) {
+    let end = amp + 1
+    while (end < s.length && s[end] >= 'a' && s[end] <= 'z') end += 1
+    // `end` now sits just past the letter run (or past the string's end).
+    const sawLetters = end > amp + 1
+    // Past-the-end reads as `undefined`, which also counts as "not a semicolon".
+    if (sawLetters && s[end] !== ';') return false
+  }
+  return true
+}
+describe('extreme-edge: single oversized narrative line (no-truncate ON)', () => {
+  // True when the rendered card still shows a step bullet (→ or ✓).
+  const hasStepBullet = (text: string): boolean => /[→✓]/.test(text)
+  it('no-truncate ON: one ~4100-char step is shown (truncated) not discarded, output ≤ budget and valid HTML', async () => {
+    const bot = makeFakeBot()
+    const fixedNow = 10_000
+    const feed = createWorkerActivityFeed({ bot, now: () => fixedNow, minEditIntervalMs: 0 })
+    // An over-4000-char latestSummary full of characters that need escaping (&, <, >).
+    const hugeStep = `${'run build && deploy && notify with <args> & flags=1 '.repeat(80)}&&`
+    expect(hugeStep.length).toBeGreaterThan(4000)
+    await feed.update('w1', 'chat', view({ toolCount: 1, latestSummary: hugeStep }))
+    expect(bot.sent).toHaveLength(1)
+    const [{ text: out }] = bot.sent
+    // The step may be truncated, but it must not disappear: a bullet has to remain.
+    expect(hasStepBullet(out)).toBe(true)
+    // Wire safety: stay within the 4096-char ceiling.
+    expect(out.length).toBeLessThanOrEqual(4096)
+    // Balanced tags, no partial entity.
+    expect(isValidWorkerHtml(out)).toBe(true)
+  })
+  it('no-truncate ON: one ~4100-char step via renderWorkerActivity directly → ≤ budget and valid HTML', () => {
+    const hugeStep = 'compile && link && package && ship: action=deploy env=<prod> flag=1 '.repeat(65)
+    expect(hugeStep.length).toBeGreaterThan(4000)
+    const out = renderWorkerActivity(view({ narrativeLines: [hugeStep] }))
+    // Truncated is acceptable; absent is not.
+    expect(hasStepBullet(out)).toBe(true)
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+  })
+})
+// ─── Bug 2: _fitWorkerBodyToCharBudget must not slice already-escaped HTML ───
+//
+// Before the fix, the extreme fallback in _fitWorkerBodyToCharBudget sliced
+// directly into the already-HTML-escaped newest line string. If the slice
+// boundary landed inside an HTML entity (&amp;, &lt;, &gt;), the output
+// contained a broken entity fragment (&am, &l, &amp without ;), which
+// Telegram Bot API rejects with HTTP 400 on parse_mode:'HTML'.
+//
+// The fix mirrors _fitToCharBudget (tool-activity-summary.ts): truncate RAW
+// content first, then escape, then wrap, re-checking post-escape because
+// escaping can expand the string (&→&amp; etc.).
+//
+// These tests place entity characters (&, <, >) at positions that, under the
+// old naive slice, would produce exactly the broken fragments the issue
+// identified (&am, &l). They assert the output is valid HTML and within budget.
+describe('Bug 2 (#2506): _fitWorkerBodyToCharBudget does not split HTML entities', () => {
+  /**
+   * Build a raw narrative line: `max(0, charBudget - 9)` 'x' characters, then
+   * `entityChar`, then 50 'y' characters.
+   *
+   * The 9-char offset is the original author's estimate of the fitter's
+   * overhead (the "→ " prefix plus the <b>…</b> wrapper), intended to place the
+   * escapable character where a naive slice of the already-escaped string
+   * would cut, so the cut lands inside `&amp;` / `&lt;` / `&gt;`.
+   *
+   * NOTE(review): another comment in this file says every line is clipped to
+   * STATUS_LINE_MAX before the char-budget backstop runs. If so, a line this
+   * long is clipped well before position `charBudget - 9` and these cases may
+   * not reach the slicing path they target — confirm against the renderer.
+   *
+   * @param entityChar character that HTML-escaping expands ('&', '<' or '>')
+   * @param charBudget character budget the boundary position is derived from
+   * @returns the raw (unescaped) line
+   */
+  function buildEntityBoundaryLine(entityChar: string, charBudget: number): string {
+    const fillLen = Math.max(0, charBudget - 9)
+    return 'x'.repeat(fillLen) + entityChar + 'y'.repeat(50)
+  }
+  it('& at entity boundary: output is valid HTML (no &am, &amp without ; etc.)', () => {
+    // A line that places '&' right at the slice boundary so naive cut → &am
+    const line = buildEntityBoundaryLine('&', 4096)
+    expect(line.length).toBeGreaterThan(100) // sanity: line is substantial
+    const out = renderWorkerActivity(view({ narrativeLines: [line] }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+    // No partial entity fragments that the old code produced.
+    expect(out).not.toMatch(/&amp$/)   // incomplete &amp; at end
+    expect(out).not.toMatch(/&am[^p]/) // &am followed by non-p (e.g. &amy)
+    // &l / &g not completed as "&lt;" / "&gt;". The previous pattern
+    // /&[lg]t?[^;]/ also matched a well-formed "&lt;" by backtracking (`t?`
+    // gives up the `t`, then `[^;]` consumes it); the lookahead cannot.
+    expect(out).not.toMatch(/&[lg](?!t;)/)
+  })
+  it('< at entity boundary: output is valid HTML (no &l, &lt without ; etc.)', () => {
+    const line = buildEntityBoundaryLine('<', 4096)
+    const out = renderWorkerActivity(view({ narrativeLines: [line] }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+    expect(out).not.toMatch(/&lt$/)    // incomplete &lt; at end
+    expect(out).not.toMatch(/&l[^t;]/) // &l followed by non-t
+  })
+  it('> at entity boundary: output is valid HTML (no &g, &gt without ; etc.)', () => {
+    const line = buildEntityBoundaryLine('>', 4096)
+    const out = renderWorkerActivity(view({ narrativeLines: [line] }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+    expect(out).not.toMatch(/&gt$/)    // incomplete &gt; at end
+    expect(out).not.toMatch(/&g[^t;]/) // &g followed by non-t
+  })
+  it('entity-dense line (& < > interleaved): output ≤ budget and valid HTML', () => {
+    // Mix entity characters throughout so any slice position is dangerous.
+    // Each chunk is 12 raw chars ("&xxx<yyy>zzz"), so 500 repeats = 6000 raw chars.
+    const chunk = '&' + 'x'.repeat(3) + '<' + 'y'.repeat(3) + '>' + 'z'.repeat(3)
+    const line = chunk.repeat(500)
+    expect(line.length).toBeGreaterThan(4000)
+    const out = renderWorkerActivity(view({ narrativeLines: [line] }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+  })
+  it('single & alone in the line: valid HTML and within budget', () => {
+    // Regression: a line whose only escapable character is one '&' is a
+    // degenerate case the fitter must handle without looping forever or
+    // returning empty content. 3000 x's, then '&', then 1000 more x's.
+    const line = 'x'.repeat(3000) + '&' + 'x'.repeat(1000)
+    expect(line.length).toBeGreaterThan(4000)
+    const out = renderWorkerActivity(view({ narrativeLines: [line] }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(isValidWorkerHtml(out)).toBe(true)
+  })
+})
+// ─── Regression: header/status row + rolling overflow survive trimming ───────
+//
+// The unified renderer clips every line to STATUS_LINE_MAX (200) BEFORE the
+// char-budget backstop, so ordinary "long step" turns fit the budget without
+// dropping any bullets. The two-line header always survives, and a rolling
+// "+N earlier…" marker appears when more than STATUS_ROLLING_LINES lines are
+// rendered directly. The char-budget backstop (fitCardToBudget) is exercised
+// only by genuinely pathological single oversized lines (covered elsewhere).
+describe('header row + rolling overflow survive in the unified worker render', () => {
+  it('the two-line header survives even with many long lines (clipped to STATUS_LINE_MAX)', () => {
+    // Five 700-char lines followed by one short, newest step.
+    const narrativeLines = [...new Array<string>(5).fill('a'.repeat(700)), 'final short step']
+    const out = renderWorkerActivity(view({ narrativeLines, toolCount: 7 }))
+    // Title row.
+    expect(out).toContain('🛠 <b>Worker</b>')
+    // Running status row: "<elapsed> · N tools".
+    expect(out).toContain('<i>10s · 7 tools</i>')
+    expect(out).toContain('7 tools')
+    // Whole card stays inside the 4096-char ceiling.
+    expect(out.length).toBeLessThanOrEqual(4096)
+    // The newest line is the live → step.
+    expect(out).toContain('<b>→ final short step</b>')
+  })
+  it('a "+N earlier…" rolling marker appears when more than STATUS_ROLLING_LINES lines render', () => {
+    const narrativeLines: string[] = []
+    for (let n = 1; n <= STATUS_ROLLING_LINES + 2; n += 1) narrativeLines.push(`step ${n}`)
+    const out = renderWorkerActivity(view({ narrativeLines }))
+    expect(out.length).toBeLessThanOrEqual(4096)
+    expect(out).toContain('earlier…')
+    expect(out).toContain('🛠 <b>Worker</b>')
+    expect(out).toContain('<i>10s · ')
+  })
+  it('back-compat path (latestSummary only) still shows a step bullet, clipped + valid HTML', () => {
+    const hugeSummary = 'deploy service && run migrations && verify health checks '.repeat(80)
+    expect(hugeSummary.length).toBeGreaterThan(4000)
+    // No narrativeLines at all: the step has to come from latestSummary.
+    const legacyView = view({ narrativeLines: undefined, latestSummary: hugeSummary })
+    const out = renderWorkerActivity(legacyView)
+    expect(out.length).toBeLessThanOrEqual(4096)
+    const hasBullet = /[→✓]/.test(out)
+    expect(hasBullet).toBe(true)
+    expect(out).toContain('🛠 <b>Worker</b>')
+    expect(out).toContain('<i>10s · ')
+    expect(isValidWorkerHtml(out)).toBe(true)
+  })
+})