npm - switchroom - Versions diffs - 0.12.26 → 0.12.28 - Mend

switchroom 0.12.26 → 0.12.28

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57) hide show

package/dist/agent-scheduler/index.js +80 -80
package/dist/auth-broker/index.js +80 -80
package/dist/cli/drive-write-pretool.mjs +10 -10
package/dist/cli/skill-validate-pretool.mjs +72 -72
package/dist/cli/switchroom.js +359 -357
package/dist/host-control/main.js +99 -99
package/dist/vault/approvals/kernel-server.js +82 -82
package/dist/vault/broker/server.js +83 -83
package/package.json +2 -1
package/telegram-plugin/dist/bridge/bridge.js +112 -112
package/telegram-plugin/dist/gateway/gateway.js +368 -209
package/telegram-plugin/dist/server.js +160 -160
package/telegram-plugin/gateway/gateway.ts +55 -40
package/telegram-plugin/gateway/inbound-delivery-machine-dispatch.ts +188 -0
package/telegram-plugin/stderr-timestamps.ts +106 -0
package/telegram-plugin/tests/inbound-delivery-machine-dispatch.test.ts +240 -0
package/telegram-plugin/tests/stderr-timestamps.test.ts +113 -0
package/vendor/hindsight-memory/.claude-plugin/plugin.json +8 -0
package/vendor/hindsight-memory/CHANGELOG.md +32 -0
package/vendor/hindsight-memory/LICENSE +21 -0
package/vendor/hindsight-memory/README.md +329 -0
package/vendor/hindsight-memory/hooks/hooks.json +49 -0
package/vendor/hindsight-memory/scripts/drain_pending.py +190 -0
package/vendor/hindsight-memory/scripts/lib/__init__.py +0 -0
package/vendor/hindsight-memory/scripts/lib/bank.py +122 -0
package/vendor/hindsight-memory/scripts/lib/client.py +204 -0
package/vendor/hindsight-memory/scripts/lib/config.py +180 -0
package/vendor/hindsight-memory/scripts/lib/content.py +493 -0
package/vendor/hindsight-memory/scripts/lib/daemon.py +334 -0
package/vendor/hindsight-memory/scripts/lib/directives.py +119 -0
package/vendor/hindsight-memory/scripts/lib/gateway_ipc.py +126 -0
package/vendor/hindsight-memory/scripts/lib/llm.py +146 -0
package/vendor/hindsight-memory/scripts/lib/pending.py +218 -0
package/vendor/hindsight-memory/scripts/lib/state.py +196 -0
package/vendor/hindsight-memory/scripts/recall.py +873 -0
package/vendor/hindsight-memory/scripts/retain.py +286 -0
package/vendor/hindsight-memory/scripts/session_end.py +122 -0
package/vendor/hindsight-memory/scripts/session_start.py +76 -0
package/vendor/hindsight-memory/scripts/setup_hooks.py +115 -0
package/vendor/hindsight-memory/scripts/tests/__init__.py +0 -0
package/vendor/hindsight-memory/scripts/tests/test_directives.py +211 -0
package/vendor/hindsight-memory/scripts/tests/test_gateway_ipc.py +205 -0
package/vendor/hindsight-memory/scripts/tests/test_recall_integration.py +621 -0
package/vendor/hindsight-memory/settings.json +37 -0
package/vendor/hindsight-memory/skills/setup.md +24 -0
package/vendor/hindsight-memory/tests/conftest.py +94 -0
package/vendor/hindsight-memory/tests/test_bank.py +142 -0
package/vendor/hindsight-memory/tests/test_client.py +232 -0
package/vendor/hindsight-memory/tests/test_config.py +128 -0
package/vendor/hindsight-memory/tests/test_content.py +471 -0
package/vendor/hindsight-memory/tests/test_drain_pending.py +192 -0
package/vendor/hindsight-memory/tests/test_hooks.py +808 -0
package/vendor/hindsight-memory/tests/test_manifest.py +14 -0
package/vendor/hindsight-memory/tests/test_pending.py +152 -0
package/vendor/hindsight-memory/tests/test_recall_exit_codes.py +325 -0
package/vendor/hindsight-memory/tests/test_session_end_pending.py +205 -0
package/vendor/hindsight-memory/tests/test_state.py +125 -0

package/vendor/hindsight-memory/tests/test_manifest.py ADDED Viewed

@@ -0,0 +1,14 @@
+"""Validate that JSON manifests are strict-valid JSON (no trailing commas, etc.)."""
+import json
+from pathlib import Path
+INTEGRATION_ROOT = Path(__file__).resolve().parent.parent
+def test_hooks_json_is_valid():
+    path = INTEGRATION_ROOT / "hooks" / "hooks.json"
+    raw = path.read_text()
+    parsed = json.loads(raw)
+    assert "hooks" in parsed
+    assert isinstance(parsed["hooks"], dict)

package/vendor/hindsight-memory/tests/test_pending.py ADDED Viewed

@@ -0,0 +1,152 @@
+"""Tests for the pending-retains persistent queue (#1071)."""
+import json
+import os
+import sys
+import time
+import unittest
+from unittest.mock import patch
+SCRIPTS_DIR = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "scripts"))
+if SCRIPTS_DIR not in sys.path:
+    sys.path.insert(0, SCRIPTS_DIR)
+import lib.pending as pending_mod  # noqa: E402
+class PendingQueueTest(unittest.TestCase):
+    def setUp(self):
+        # Use a temp dir scoped per-test so concurrent runs don't
+        # collide. The module reads HINDSIGHT_PENDING_DIR on every call,
+        # not at import time — no reload needed.
+        import tempfile
+        self._tmp = tempfile.mkdtemp(prefix="hindsight-pending-test-")
+        self._dir = os.path.join(self._tmp, "pending-retains")
+        os.environ["HINDSIGHT_PENDING_DIR"] = self._dir
+    def tearDown(self):
+        import shutil
+        shutil.rmtree(self._tmp, ignore_errors=True)
+        os.environ.pop("HINDSIGHT_PENDING_DIR", None)
+    def _sample_payload(self, document_id: str = "doc-1") -> dict:
+        return {
+            "api_url": "http://fake:9077",
+            "api_token": None,
+            "bank_id": "test-bank",
+            "content": "user: hello\nassistant: hi",
+            "document_id": document_id,
+            "context": "claude-code",
+            "metadata": {"session_id": "sess-1"},
+            "tags": None,
+        }
+    def test_enqueue_creates_dir_with_mode_0700(self):
+        self.assertFalse(os.path.isdir(self._dir))
+        pending_mod.enqueue(self._sample_payload(), RuntimeError("boom"))
+        self.assertTrue(os.path.isdir(self._dir))
+        mode = os.stat(self._dir).st_mode & 0o777
+        self.assertEqual(mode, 0o700)
+    def test_enqueue_writes_payload_and_error_metadata(self):
+        path = pending_mod.enqueue(self._sample_payload(), ValueError("nope"))
+        self.assertIsNotNone(path)
+        self.assertTrue(os.path.isfile(path))
+        with open(path) as f:
+            entry = json.load(f)
+        self.assertEqual(entry["bank_id"], "test-bank")
+        self.assertEqual(entry["content"], "user: hello\nassistant: hi")
+        self.assertEqual(entry["document_id"], "doc-1")
+        self.assertEqual(entry["error_class"], "ValueError")
+        self.assertEqual(entry["error_message"], "nope")
+        self.assertEqual(entry["attempt_count"], 1)
+        self.assertIn("failed_at", entry)
+        self.assertEqual(entry["schema"], pending_mod.SCHEMA)
+    def test_enqueue_filename_is_unix_ms_uuid(self):
+        path = pending_mod.enqueue(self._sample_payload(), RuntimeError("boom"))
+        name = os.path.basename(path)
+        self.assertTrue(name.endswith(".json"))
+        head = name[: -len(".json")]
+        ts_part, uuid_part = head.split("-", 1)
+        self.assertTrue(ts_part.isdigit())
+        # Filename ts should be within 10 s of now
+        now_ms = int(time.time() * 1000)
+        self.assertLess(abs(now_ms - int(ts_part)), 10_000)
+        self.assertEqual(len(uuid_part), 12)
+    def test_enqueue_atomic_no_tmp_left_behind(self):
+        pending_mod.enqueue(self._sample_payload(), RuntimeError("boom"))
+        names = sorted(os.listdir(self._dir))
+        self.assertEqual(len(names), 1)
+        self.assertFalse(any(n.endswith(".tmp") for n in names))
+    def test_enqueue_returns_none_when_full(self):
+        # Pre-populate with MAX_ENTRIES dummy files.
+        os.makedirs(self._dir, mode=0o700)
+        for i in range(pending_mod.MAX_ENTRIES):
+            with open(os.path.join(self._dir, f"{i:013d}-aaaaaaaaaaaa.json"), "w") as f:
+                json.dump({"placeholder": True}, f)
+        result = pending_mod.enqueue(self._sample_payload(), RuntimeError("boom"))
+        self.assertIsNone(result)
+        # Count unchanged
+        self.assertEqual(pending_mod.count(), pending_mod.MAX_ENTRIES)
+    def test_iter_entries_ordered_oldest_first(self):
+        p1 = pending_mod.enqueue(self._sample_payload("doc-1"), RuntimeError("e1"))
+        time.sleep(0.005)
+        p2 = pending_mod.enqueue(self._sample_payload("doc-2"), RuntimeError("e2"))
+        time.sleep(0.005)
+        p3 = pending_mod.enqueue(self._sample_payload("doc-3"), RuntimeError("e3"))
+        entries = pending_mod.iter_entries()
+        paths = [e[0] for e in entries]
+        self.assertEqual(paths, [p1, p2, p3])
+    def test_iter_entries_skips_malformed(self):
+        os.makedirs(self._dir, mode=0o700)
+        # Good
+        good = pending_mod.enqueue(self._sample_payload(), RuntimeError("ok"))
+        # Bad (not JSON)
+        with open(os.path.join(self._dir, f"{int(time.time() * 1000) + 1}-bad.json"), "w") as f:
+            f.write("not json")
+        entries = pending_mod.iter_entries()
+        paths = [e[0] for e in entries]
+        self.assertIn(good, paths)
+        # The bad file is skipped, not raised
+        self.assertEqual(len(entries), 1)
+    def test_update_attempt_bumps_count_atomically(self):
+        path = pending_mod.enqueue(self._sample_payload(), RuntimeError("first"))
+        entries = pending_mod.iter_entries()
+        _, entry = entries[0]
+        self.assertEqual(entry["attempt_count"], 1)
+        ok = pending_mod.update_attempt(path, entry, RuntimeError("second"))
+        self.assertTrue(ok)
+        with open(path) as f:
+            reread = json.load(f)
+        self.assertEqual(reread["attempt_count"], 2)
+        self.assertEqual(reread["error_message"], "second")
+        self.assertIn("last_attempt_at", reread)
+    def test_mark_dead_renames_to_dot_dead(self):
+        path = pending_mod.enqueue(self._sample_payload(), RuntimeError("boom"))
+        entries = pending_mod.iter_entries()
+        _, entry = entries[0]
+        dead = pending_mod.mark_dead(path, entry)
+        self.assertTrue(dead.endswith(".dead"))
+        self.assertFalse(os.path.exists(path))
+        self.assertTrue(os.path.isfile(dead))
+        with open(dead) as f:
+            reread = json.load(f)
+        self.assertIn("dead_at", reread)
+        # iter_entries no longer surfaces .dead files
+        self.assertEqual(pending_mod.iter_entries(), [])
+    def test_count_safe_when_dir_missing(self):
+        self.assertEqual(pending_mod.count(), 0)
+if __name__ == "__main__":  # run the unittest runner when this file is executed as a script
+    unittest.main()

package/vendor/hindsight-memory/tests/test_recall_exit_codes.py ADDED Viewed

@@ -0,0 +1,325 @@
+"""Exit-code contract for recall.py's top-level exception handler.
+Switchroom #1070 (redo per #1085 review feedback).
+The original fix changed non-debug uncaught exceptions to exit 2,
+assuming `bin/run-hook.sh`'s `record_failure` path would fire. But
+recall.py is registered as a DIRECT Claude Code plugin hook
+(`vendor/hindsight-memory/hooks/hooks.json`), not wrapped. Per Claude
+Code's `UserPromptSubmit` hook contract, exit 2 blocks the user's
+prompt and surfaces stderr to them — so a hindsight outage would
+block every turn.
+The corrected contract pinned by these tests:
+* Non-debug uncaught exception → exit code 0 (agent stays responsive),
+  empty stdout (matches the no-memories success-path shape), stderr
+  carrying the class + message but NOT a traceback, AND a synchronous
+  shell-out to `switchroom issues record --severity warn --source
+  hindsight.recall --code recall_failed ...` so the #424 issue-sink
+  still captures the outage.
+* The shell-out is fault-tolerant: if the `switchroom` binary is
+  missing, hangs, or exits non-zero, recall.py still exits 0 with the
+  safe stdout shape.
+* Stderr / issue-sink detail are passed through an inline secret
+  redactor (bearer tokens, ?token=…/&api_key=… query-string creds,
+  x-api-key headers) so credentials leaking out of `lib/client.py:73`'s
+  `RuntimeError(f"HTTP {e.code} from {url}: ...")` don't land in
+  journald or the issues store.
+* Debug uncaught exception (HINDSIGHT_DEBUG=1) → exit code 2 with
+  full traceback. Unchanged — live-debugging operators opt in.
+The fault is injected by monkey-patching a helper called during
+``main()`` so the top-level except handler fires. We run the script
+as a subprocess so the real ``if __name__ == '__main__':`` block
+executes.
+"""
+import json
+import os
+import subprocess
+import sys
+import textwrap
+SCRIPTS_DIR = os.path.abspath(  # absolute path of the sibling ../scripts directory
+    os.path.join(os.path.dirname(__file__), "..", "scripts")
+)
+RECALL_PY = os.path.join(SCRIPTS_DIR, "recall.py")  # path of recall.py inside SCRIPTS_DIR
+def _run_recall_with_injected_fault(
+    tmp_path,
+    debug=False,
+    fault_message="boom: simulated fault",
+    switchroom_shim=None,
+):
+    """Run recall.py as a subprocess after injecting a fault into a
+    lib helper called *during* main() so the top-level except handler
+    fires. We target ``lib.gateway_ipc.extract_chat_id_from_prompt``
+    because it's called unconditionally in the recall flow and
+    crucially does NOT touch lib.config — so the handler's own
+    ``load_config()`` call (used to decide on traceback verbosity)
+    still works.
+    ``switchroom_shim`` (optional) is shell script content; if
+    provided, a `switchroom` executable with that content is prepended
+    to PATH so the handler's subprocess call resolves to it instead
+    of (or instead of failing to find) the real CLI.
+    Returns the CompletedProcess.
+    """
+    shim = tmp_path / "fault_shim.py"
+    shim.write_text(
+        textwrap.dedent(
+            f"""\
+            import sys, os, runpy
+            sys.path.insert(0, {SCRIPTS_DIR!r})
+            from lib import gateway_ipc as _gw
+            def _boom(*a, **kw):
+                raise RuntimeError({fault_message!r})
+            _gw.extract_chat_id_from_prompt = _boom
+            # Run recall.py as __main__ so the top-level try/except
+            # block executes exactly as it does in production.
+            runpy.run_path({RECALL_PY!r}, run_name="__main__")
+            """
+        )
+    )
+    env = os.environ.copy()
+    # Strip any real HINDSIGHT_* / CLAUDE_PLUGIN_* env that might bleed in
+    for key in list(env):
+        if key.startswith(("HINDSIGHT_", "CLAUDE_PLUGIN_")):
+            env.pop(key, None)
+    env["HOME"] = str(tmp_path)
+    env["CLAUDE_PLUGIN_ROOT"] = str(tmp_path / "plugin_root")
+    env["CLAUDE_PLUGIN_DATA"] = str(tmp_path / "plugin_data")
+    (tmp_path / "plugin_root").mkdir(exist_ok=True)
+    (tmp_path / "plugin_data").mkdir(exist_ok=True)
+    if debug:
+        env["HINDSIGHT_DEBUG"] = "1"
+    # Path manipulation for the switchroom shim. We always isolate
+    # PATH so the test doesn't accidentally invoke a real `switchroom`
+    # on the host — that would write to a real state dir.
+    bindir = tmp_path / "bin"
+    bindir.mkdir(exist_ok=True)
+    if switchroom_shim is not None:
+        sw = bindir / "switchroom"
+        sw.write_text(switchroom_shim)
+        sw.chmod(0o755)
+    # Keep system path elements for /usr/bin/env etc., but put our
+    # bindir FIRST so any shim wins.
+    env["PATH"] = f"{bindir}:{env.get('PATH', '/usr/bin:/bin')}"
+    proc = subprocess.run(
+        [sys.executable, str(shim)],
+        input=json.dumps({"prompt": "anything", "session_id": "s"}),
+        capture_output=True,
+        text=True,
+        env=env,
+        timeout=15,
+    )
+    return proc
+# Default recording shim: writes each argv item followed by a NUL, a ---STDIN--- marker line,
+# then its stdin to the file named by $SHIM_RECORD (default /tmp/sw-shim-record). Exit 0.
+_RECORDING_SHIM = textwrap.dedent(
+    """\
+    #!/usr/bin/env bash
+    set -u
+    out="${SHIM_RECORD:-/tmp/sw-shim-record}"
+    {
+      for a in "$@"; do printf '%s\\0' "$a"; done
+      printf -- '---STDIN---\\n'
+      cat
+    } > "$out"
+    exit 0
+    """
+)
+class TestRecallExitCodes:
+    def test_nondebug_uncaught_exits_zero(self, tmp_path):
+        """Headline contract: a hindsight outage must NOT block the
+        user's prompt. exit 0 → Claude Code accepts the empty
+        additionalContext and proceeds with normal turn handling."""
+        proc = _run_recall_with_injected_fault(tmp_path, debug=False)
+        assert proc.returncode == 0, (
+            f"expected exit 0, got {proc.returncode}; "
+            f"stderr={proc.stderr!r}"
+        )
+    def test_nondebug_stdout_is_empty_memory_shape(self, tmp_path):
+        """Stdout must match the no-memories success-path shape. In
+        recall.py that path is a bare `return` with nothing dumped
+        to stdout (see line ~660 — the `if not directives_block and
+        not memories_block: return` branch). So stdout must be the
+        empty string."""
+        proc = _run_recall_with_injected_fault(tmp_path, debug=False)
+        assert proc.stdout == "", (
+            f"expected empty stdout, got {proc.stdout!r}"
+        )
+    def test_nondebug_stderr_includes_class_and_message(self, tmp_path):
+        """Operators reading journald need the class + message to
+        understand what broke. The full traceback stays gated behind
+        HINDSIGHT_DEBUG=1."""
+        proc = _run_recall_with_injected_fault(
+            tmp_path, debug=False, fault_message="kaboom-1070"
+        )
+        assert "RuntimeError" in proc.stderr
+        assert "kaboom-1070" in proc.stderr
+        assert "Unexpected error in recall" in proc.stderr
+    def test_nondebug_stderr_omits_traceback(self, tmp_path):
+        """#1069 threat model: don't dump tracebacks (which may
+        include local-variable repr in some frames or framework
+        internals) to unredacted stderr unless debug mode is on."""
+        proc = _run_recall_with_injected_fault(tmp_path, debug=False)
+        # The Python traceback module emits "Traceback (most recent
+        # call last):" as the first line. Its absence is the cheap,
+        # unambiguous check.
+        assert "Traceback (most recent call last)" not in proc.stderr, (
+            f"non-debug stderr leaked traceback: {proc.stderr!r}"
+        )
+    def test_nondebug_invokes_issues_record_subprocess(self, tmp_path):
+        """The substitute for the wrapper's record_failure path:
+        recall.py must shell out to `switchroom issues record` itself.
+        Assert the call argv shape via a recording shim on PATH."""
+        record_path = tmp_path / "shim_record.txt"
+        env_override_shim = _RECORDING_SHIM.replace(
+            '${SHIM_RECORD:-/tmp/sw-shim-record}', str(record_path)
+        )
+        proc = _run_recall_with_injected_fault(
+            tmp_path,
+            debug=False,
+            fault_message="kaboom-call-shape",
+            switchroom_shim=env_override_shim,
+        )
+        assert proc.returncode == 0
+        assert record_path.exists(), (
+            f"switchroom shim was not invoked; stderr={proc.stderr!r}"
+        )
+        raw = record_path.read_bytes()
+        head, _, tail = raw.partition(b"---STDIN---\n")
+        argv = [a.decode() for a in head.split(b"\x00") if a]
+        # Expected verb chain
+        assert argv[0:3] == ["issues", "record", "--severity"], argv
+        assert "warn" in argv
+        assert "--source" in argv
+        assert "hindsight.recall" in argv
+        assert "--code" in argv
+        assert "recall_failed" in argv
+        assert "--summary" in argv
+        # Summary contains the class
+        assert any(
+            "Hindsight recall failed: RuntimeError" in a for a in argv
+        ), argv
+        assert "--detail-stdin" in argv
+        assert "--quiet" in argv
+        # Stdin carries class + message
+        stdin_payload = tail.decode()
+        assert "RuntimeError" in stdin_payload
+        assert "kaboom-call-shape" in stdin_payload
+    def test_nondebug_issues_record_failure_does_not_propagate(self, tmp_path):
+        """If the shim exits non-zero (or the binary is missing or
+        hangs), recall.py must still exit 0 with the safe stdout
+        shape. The agent's responsiveness on a hindsight outage MUST
+        NOT depend on the issue sink also working."""
+        failing_shim = "#!/usr/bin/env bash\nexit 17\n"
+        proc = _run_recall_with_injected_fault(
+            tmp_path, debug=False, switchroom_shim=failing_shim
+        )
+        assert proc.returncode == 0, (
+            f"shim failure leaked through; rc={proc.returncode} "
+            f"stderr={proc.stderr!r}"
+        )
+        assert proc.stdout == ""
+    def test_nondebug_missing_switchroom_binary_does_not_propagate(self, tmp_path):
+        """The other failure mode: the binary isn't on PATH at all.
+        FileNotFoundError must be swallowed; agent still exits 0."""
+        # Empty bindir, no shim. PATH will only contain our empty
+        # bindir + system paths; system paths shouldn't have a
+        # `switchroom` on a test runner (and even if they do, the
+        # important thing is exit 0).
+        proc = _run_recall_with_injected_fault(
+            tmp_path, debug=False, switchroom_shim=None
+        )
+        # We can't assert the shim wasn't called (we didn't install
+        # one) but we CAN assert recall.py still exits 0.
+        assert proc.returncode == 0, (
+            f"missing-binary path leaked; rc={proc.returncode} "
+            f"stderr={proc.stderr!r}"
+        )
+    def test_nondebug_redacts_token_in_message(self, tmp_path):
+        """Exception messages from `lib/client.py:73` interpolate the
+        request URL into a RuntimeError; that URL may carry
+        `?api_key=...` or `Authorization: Bearer ...` in the body
+        echo. The redactor must scrub these from BOTH stderr and the
+        issues-record stdin payload.
+        Per repo convention (CLAUDE.md "Secrets in tests"), the
+        token-shaped fixture is built by string concatenation so the
+        source file never contains a contiguous secret-looking blob.
+        """
+        # Construct a fake token at runtime
+        fake_token = "sk" + "-" + "ant" + "-" + "a" * 40
+        fault_msg = (
+            "HTTP 401 from https://api.example.com/recall"
+            f"?api_key={fake_token}: unauthorized"
+        )
+        record_path = tmp_path / "shim_record.txt"
+        env_override_shim = _RECORDING_SHIM.replace(
+            '${SHIM_RECORD:-/tmp/sw-shim-record}', str(record_path)
+        )
+        proc = _run_recall_with_injected_fault(
+            tmp_path,
+            debug=False,
+            fault_message=fault_msg,
+            switchroom_shim=env_override_shim,
+        )
+        assert proc.returncode == 0
+        assert fake_token not in proc.stderr, (
+            f"token leaked to stderr: {proc.stderr!r}"
+        )
+        assert record_path.exists()
+        payload = record_path.read_bytes().decode("utf-8", errors="replace")
+        assert fake_token not in payload, (
+            f"token leaked to issues-record payload: {payload!r}"
+        )
+    def test_nondebug_redacts_bearer_in_message(self, tmp_path):
+        """Bearer-token shape is the other common leak vector."""
+        fake_bearer = "abcdef" + "0123456789" * 4
+        fault_msg = f"HTTP 401: Authorization: Bearer {fake_bearer} rejected"
+        proc = _run_recall_with_injected_fault(
+            tmp_path,
+            debug=False,
+            fault_message=fault_msg,
+            switchroom_shim=_RECORDING_SHIM,
+        )
+        assert proc.returncode == 0
+        assert fake_bearer not in proc.stderr, (
+            f"bearer leaked to stderr: {proc.stderr!r}"
+        )
+    def test_debug_exits_two_with_traceback(self, tmp_path):
+        """In debug mode, the traceback is allowed AND we exit 2.
+        Unchanged from the existing debug-branch behaviour."""
+        proc = _run_recall_with_injected_fault(tmp_path, debug=True)
+        assert proc.returncode == 2, (
+            f"expected exit 2 in debug, got {proc.returncode}; "
+            f"stderr={proc.stderr!r}"
+        )
+        assert "Traceback (most recent call last)" in proc.stderr, (
+            f"debug stderr missing traceback: {proc.stderr!r}"
+        )