PyPI - dos-kernel - Versions diffs - 0.22.0__py3-none-win_amd64.whl - Mend

dos-kernel 0.22.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (178) hide show

dos/__init__.py +261 -0
dos/_bin/dos-hook.exe +0 -0
dos/_filelock.py +255 -0
dos/_job_policy.py +97 -0
dos/_tree.py +145 -0
dos/admission.py +433 -0
dos/answer_shape.py +299 -0
dos/arbiter.py +859 -0
dos/archive_lock.py +266 -0
dos/arg_provenance.py +814 -0
dos/attest.py +472 -0
dos/breaker.py +311 -0
dos/churn.py +226 -0
dos/claim_extract.py +229 -0
dos/claim_ttl.py +150 -0
dos/cli.py +8721 -0
dos/commit_audit.py +666 -0
dos/completion.py +466 -0
dos/concurrency_class.py +154 -0
dos/config.py +1380 -0
dos/config_lint.py +464 -0
dos/cooldown.py +390 -0
dos/coverage.py +387 -0
dos/dangling_intent.py +287 -0
dos/data_class.py +397 -0
dos/decisions.py +1274 -0
dos/decisions_tui.py +251 -0
dos/dispatch_top.py +740 -0
dos/dispatch_top_tui.py +116 -0
dos/drivers/__init__.py +40 -0
dos/drivers/ci_status.py +630 -0
dos/drivers/citation_resolve.py +703 -0
dos/drivers/decision_stop.py +98 -0
dos/drivers/export_file.py +173 -0
dos/drivers/export_otlp.py +275 -0
dos/drivers/export_statsd.py +242 -0
dos/drivers/hook_dialects.py +391 -0
dos/drivers/job.py +47 -0
dos/drivers/llm_judge.py +360 -0
dos/drivers/memory_recall.py +1231 -0
dos/drivers/notify_slack.py +373 -0
dos/drivers/notify_webhook.py +251 -0
dos/drivers/operator_judge.py +114 -0
dos/drivers/os_acceptance.py +228 -0
dos/drivers/paste_log.py +132 -0
dos/drivers/plan_scope.py +133 -0
dos/drivers/self_improve.py +375 -0
dos/drivers/similarity_judge.py +249 -0
dos/drivers/state_diff.py +274 -0
dos/drivers/supervisor.py +347 -0
dos/drivers/watchdog.py +363 -0
dos/drivers/workshop.py +160 -0
dos/durable_schema.py +344 -0
dos/effect_witness.py +393 -0
dos/efficiency.py +318 -0
dos/enforce.py +414 -0
dos/enumerate.py +776 -0
dos/env_print.py +378 -0
dos/event_severity.py +258 -0
dos/evidence.py +692 -0
dos/exec_capability.py +256 -0
dos/export_cursor.py +143 -0
dos/exporter.py +320 -0
dos/firing_label.py +353 -0
dos/fleet_roll.py +226 -0
dos/gate_classify.py +827 -0
dos/gh4_coverage.py +179 -0
dos/git_delta.py +122 -0
dos/guard.py +215 -0
dos/health.py +552 -0
dos/help_summary.py +519 -0
dos/home.py +934 -0
dos/hook_binary.py +194 -0
dos/hook_dialect.py +271 -0
dos/hook_exit.py +191 -0
dos/hook_install.py +437 -0
dos/id_alloc.py +304 -0
dos/improve.py +499 -0
dos/intent_ledger.py +635 -0
dos/interpret.py +176 -0
dos/intervention.py +769 -0
dos/intervention_eval.py +371 -0
dos/journal_delta.py +308 -0
dos/judge_eval.py +328 -0
dos/judges.py +366 -0
dos/lane_infer.py +127 -0
dos/lane_journal.py +1001 -0
dos/lane_lease.py +952 -0
dos/lane_overlap.py +228 -0
dos/lease_health.py +282 -0
dos/lifecycle.py +211 -0
dos/liveness.py +352 -0
dos/lock_modes.py +185 -0
dos/log_source.py +395 -0
dos/loop_decide.py +1746 -0
dos/marker_gate.py +254 -0
dos/marker_sensor.py +396 -0
dos/noop_streak.py +280 -0
dos/notify.py +479 -0
dos/observe.py +175 -0
dos/oracle.py +1661 -0
dos/overlap_eval.py +214 -0
dos/overlap_policy.py +342 -0
dos/packet_sidecar.py +267 -0
dos/phase_shipped.py +1985 -0
dos/pick_priority.py +225 -0
dos/pickable.py +369 -0
dos/picker_oracle.py +1037 -0
dos/plan_board.py +513 -0
dos/plan_board_tui.py +113 -0
dos/plan_source.py +455 -0
dos/posttool_sensor.py +528 -0
dos/precursor_gate.py +499 -0
dos/precursor_gate_eval.py +239 -0
dos/preflight.py +825 -0
dos/pretool_sensor.py +490 -0
dos/proc_delta.py +181 -0
dos/productivity.py +296 -0
dos/provider_limit.py +242 -0
dos/py.typed +4 -0
dos/reason_morphology.py +299 -0
dos/reasons.py +449 -0
dos/reconcile.py +173 -0
dos/recurring_wedge.py +206 -0
dos/render.py +393 -0
dos/result_state.py +468 -0
dos/resume.py +578 -0
dos/resume_evidence.py +293 -0
dos/retention.py +344 -0
dos/reward.py +372 -0
dos/rewind.py +587 -0
dos/rewind_evidence.py +168 -0
dos/rewind_tokens.py +252 -0
dos/run_id.py +342 -0
dos/scope.py +520 -0
dos/scope_source.py +382 -0
dos/scout.py +982 -0
dos/self_modify.py +209 -0
dos/sibling_scan.py +569 -0
dos/skills/EXAMPLES.md +584 -0
dos/skills/dos-class-cycle/SKILL.md +107 -0
dos/skills/dos-dispatch/SKILL.md +177 -0
dos/skills/dos-dispatch-loop/SKILL.md +254 -0
dos/skills/dos-goal-gate/SKILL.md +269 -0
dos/skills/dos-next-up/SKILL.md +231 -0
dos/skills/dos-promote/SKILL.md +114 -0
dos/skills/dos-replan/SKILL.md +159 -0
dos/skills/dos-replan-loop/SKILL.md +114 -0
dos/skills/dos-self-improve/SKILL.md +213 -0
dos/skills/dos-supervise-loop/SKILL.md +180 -0
dos/skills/dos-unstick/SKILL.md +108 -0
dos/skills/dos-witness-claim/SKILL.md +251 -0
dos/stamp.py +1002 -0
dos/state_health.py +387 -0
dos/status.py +114 -0
dos/stop_policy.py +334 -0
dos/supervise.py +1014 -0
dos/testwitness.py +392 -0
dos/timeline.py +1027 -0
dos/tokens.py +485 -0
dos/tool_stream.py +393 -0
dos/tool_stream_eval.py +226 -0
dos/trace.py +524 -0
dos/verdict.py +140 -0
dos/verdict_cli.py +189 -0
dos/verdict_journal.py +497 -0
dos/verdict_rollup.py +217 -0
dos/verdicts.py +181 -0
dos/wedge_reason.py +282 -0
dos_kernel-0.22.0.dist-info/METADATA +859 -0
dos_kernel-0.22.0.dist-info/RECORD +178 -0
dos_kernel-0.22.0.dist-info/WHEEL +5 -0
dos_kernel-0.22.0.dist-info/entry_points.txt +39 -0
dos_kernel-0.22.0.dist-info/licenses/LICENSE +21 -0
dos_kernel-0.22.0.dist-info/top_level.txt +2 -0
dos_mcp/__init__.py +52 -0
dos_mcp/py.typed +2 -0
dos_mcp/server.py +779 -0

dos/resume_evidence.py ADDED Viewed

@@ -0,0 +1,293 @@
+"""resume-evidence — the boundary I/O for the resume axis (docs/107 §3.3, §5).
+`resume.resume_plan` is a PURE verdict over `AncestryFacts` (which claimed SHAs are
+in ancestry). SOMETHING has to gather those facts from git, and SOMETHING has to
+mint a `STEP_VERIFIED` by re-checking a claimed SHA against the non-forgeable rung
+(§5 req 2). That is this module — the resume axis's `git_delta`/`journal_delta`:
+boundary I/O (subprocess + the served root) feeding the pure core, never inside the
+verdict.
+Two boundary jobs:
+  * **`gather_ancestry(...)`** — ask git which of a set of claimed SHAs are
+    reachable from HEAD on the served workspace, and freeze the answer into the
+    `AncestryFacts` the pure `resume_plan` consumes. The `liveness` evidence-gather
+    shape: the subprocess happens HERE, the already-decided membership is handed to
+    the classifier.
+  * **`verify_step(...)`** — the `STEP_VERIFIED` MINT (§5). Given a claimed
+    `(step_id, sha)`, decide whether it may become a minted belief: the SHA must be
+    **in ancestry** AND the commit must stand on the **non-forgeable rung** (it
+    touched ≥1 distinctive file — NOT an `--allow-empty` commit, NOT a
+    bookkeeping/release-bump-only footprint). A step that passes yields a
+    `STEP_VERIFIED` entry tagged `via="file-path"`; one that fails yields *nothing*
+    (it stays in the residual). **A forged `--allow-empty` step never reaches
+    `STEP_VERIFIED`** — the load-bearing Phase-3 guarantee.
+The served root is passed EXPLICITLY (never the process-global active config), so a
+long-lived caller fielding several workspaces — the MCP server, a fleet daemon —
+gets the right tree (the `git_delta` discipline). Every failure mode degrades to
+the SAFE direction: a SHA we cannot resolve is treated as NOT in ancestry / NOT
+verifiable (fail-closed — a step we cannot prove landed must be redone, never
+skipped), the opposite of `git_delta`'s permissive empty (because here the safe
+direction for a *resume anchor* is "don't trust it," whereas for a *liveness
+delta* it is "no progress observed").
+"""
+from __future__ import annotations
+import subprocess
+from pathlib import Path
+from typing import Iterable
+from dos import config as _config
+from dos import intent_ledger as _il
+from dos.intent_ledger import LedgerState
+from dos.resume import AncestryFacts
+_GIT_TIMEOUT_S = 15
+def _is_ancestor(sha: str, *, root: Path | str) -> bool:
+    """True iff `sha` is reachable from HEAD (an ancestor) on `root`. Fail-closed.
+    `git merge-base --is-ancestor <sha> HEAD` exits 0 iff `sha` is an ancestor of
+    HEAD, 1 iff not, and >1 on error (bad sha, not a git dir). We treat ONLY a
+    clean exit-0 as "in ancestry" — every other outcome (unknown sha, git missing,
+    timeout, non-git dir) is `False` (the safe direction for a resume anchor: a SHA
+    we cannot prove is reachable must not anchor a resume point). The opposite of
+    `git_delta`'s permissive-empty, because the safe failure here is "don't trust."
+    """
+    s = (sha or "").strip()
+    if not s:
+        return False
+    try:
+        res = subprocess.run(
+            ["git", "merge-base", "--is-ancestor", s, "HEAD"],
+            cwd=str(root),
+            capture_output=True,
+            text=True,
+            check=False,
+            timeout=_GIT_TIMEOUT_S,
+        )
+    except (OSError, subprocess.TimeoutExpired):
+        return False
+    return res.returncode == 0
+def _touched_files(sha: str, *, root: Path | str) -> set[str] | None:
+    """The repo-relative paths commit `sha` touched on `root`, or None if unresolvable.
+    The explicit-root sibling of `oracle._git_touched_files` (which reads the
+    process-global active config). None means "could not resolve" (unknown sha,
+    shallow clone, git missing) — the caller treats it as NOT verifiable
+    (fail-closed). An EMPTY set means the commit touched NO files: an `--allow-empty`
+    commit — the exact forgeable case §5 req 2 forecloses.
+    """
+    s = (sha or "").strip()
+    if not s:
+        return None
+    try:
+        res = subprocess.run(
+            ["git", "show", "--name-only", "--format=", s],
+            cwd=str(root),
+            capture_output=True,
+            text=True,
+            encoding="utf-8",
+            errors="replace",
+            timeout=_GIT_TIMEOUT_S,
+            check=False,
+        )
+    except (OSError, subprocess.TimeoutExpired):
+        return None
+    if res.returncode != 0:
+        return None
+    return {ln.strip().replace("\\", "/") for ln in res.stdout.splitlines() if ln.strip()}
+def step_stands_on_nonforgeable_rung(
+    sha: str, *, root: Path | str,
+    region: "list[str] | tuple[str, ...] | None" = None,
+    touched_files=None,
+    is_ancestor=None,
+) -> bool:
+    """True iff `sha` is a SAFE resume anchor — in ancestry AND its footprint is real (§5).
+    The §5-req-2 predicate, the heart of the mint. A claimed step's SHA earns a
+    `STEP_VERIFIED` ONLY when all hold:
+      1. **In ancestry.** The commit is reachable from HEAD (`_is_ancestor`). A
+         claimed SHA that is not in ancestry is a step the agent SAID it landed but
+         never did (or that was rewritten out) — fail-closed, not verified.
+      2. **Non-forgeable footprint.** The commit touched ≥1 real file. An
+         `--allow-empty` commit (the forgeable rung §5 names: an empty commit whose
+         SUBJECT names the step) touches NO files, so it fails this — exactly the
+         named attack.
+      3. **Footprint INTERSECTS the step's declared region (when one is declared).**
+         This closes the residual §5 hole the adversarial review found: requirement 2
+         alone defeats `--allow-empty` but NOT a forged record pointing at any *real,
+         unrelated* commit (the attacker needs only ANY ancestry SHA). When the step
+         declared a file region (a list of repo-relative globs in its INTENT), the
+         commit's touched-file set must OVERLAP that region — a commit that touched
+         only files OUTSIDE the step's region is not that step's work, even if it is a
+         real ancestry commit. Overlap reuses the kernel's ONE collision algebra
+         (`_tree.lane_trees_disjoint`, case-folded / leading-glob-aware) so there is
+         no second match definition. A step with NO declared region falls back to
+         requirement 2 only (the `--allow-empty` defense) — additive, so a region-less
+         ledger still gets real protection, just not region-pinned.
+    `touched_files` / `is_ancestor` are injectable (callable(sha)->set|None and
+    callable(sha)->bool) so the predicate is unit-testable WITHOUT git — the
+    `oracle`/`liveness` injection discipline. Production passes neither and the
+    git-backed defaults run against `root`.
+    """
+    anc = is_ancestor or (lambda x: _is_ancestor(x, root=root))
+    touch = touched_files or (lambda x: _touched_files(x, root=root))
+    if not anc(sha):
+        return False
+    files = touch(sha)
+    if not files:  # None (unresolvable) OR empty (--allow-empty) → not a safe anchor
+        return False
+    if region:
+        # The footprint must OVERLAP the step's declared region. The concrete touched
+        # files are treated as zero-wildcard "globs"; intersection is the negation of
+        # the kernel's disjointness verdict — one algebra, no drift.
+        from dos._tree import lane_trees_disjoint
+        if lane_trees_disjoint(list(files), list(region)):
+            return False  # commit touched only files OUTSIDE the step's region
+    return True
+def verify_step(
+    run_id: str,
+    step_id: str,
+    sha: str,
+    *,
+    cfg: "_config.SubstrateConfig | None" = None,
+    path: Path | None = None,
+    region: "list[str] | tuple[str, ...] | None" = None,
+    touched_files=None,
+    is_ancestor=None,
+) -> dict | None:
+    """Mint a `STEP_VERIFIED` for `(step_id, sha)` IFF it stands on the non-forgeable rung.
+    The CLI-boundary write the dispatch loop / `dos resume verify-step` calls after
+    an agent claims a step. Re-checks the claimed SHA against ancestry on the
+    non-forgeable rung (`step_stands_on_nonforgeable_rung`, incl. the `region`
+    intersection when one is declared); on success appends a `STEP_VERIFIED` entry
+    (tagged `via="file-path"`) to the run's ledger and returns the stamped entry; on
+    failure appends NOTHING and returns None (the step stays in the residual — a
+    forged/unverifiable claim is never minted into a belief).
+    This is the §5-req-2 guarantee in code: a step the agent merely CLAIMED — claimed
+    with an `--allow-empty` commit, or claimed against a real-but-unrelated commit
+    outside its declared region — cannot reach `STEP_VERIFIED`, so it can never become
+    a resume anchor that skips work that never happened.
+    """
+    cfg = _config.ensure(cfg)
+    if not step_stands_on_nonforgeable_rung(
+        sha, root=cfg.paths.root, region=region,
+        touched_files=touched_files, is_ancestor=is_ancestor,
+    ):
+        return None
+    entry = _il.step_verified_entry(step_id, sha, via="file-path")
+    return _il.append(run_id, entry, path=path, cfg=cfg)
+def adjudicate_verified_steps(
+    state: LedgerState,
+    *,
+    root: Path | str,
+    touched_files=None,
+    is_ancestor=None,
+) -> frozenset[str]:
+    """Re-adjudicate, at READ time, which steps stand on the non-forgeable rung (§5).
+    The docs/107 §5 / docs/103 fix, and the heart of "the kernel doesn't believe the
+    agents." The intent ledger is written BY the distrusted run, so a stored
+    `STEP_VERIFIED` record is an UNAUTHENTICATED HINT — a malicious run can append its
+    own `STEP_VERIFIED {via: "file-path", sha: <any real ancestry commit>}` for a step
+    it never did. This RE-RUNS the non-forgeable footprint check
+    (`step_stands_on_nonforgeable_rung`) on each step's SHA, and returns ONLY the step
+    ids that pass — the authority the pure `resume_plan` trusts for "done"
+    (`AncestryFacts.steps_verified_at_read`), never the agent's say-so.
+    For each declared step we re-check the step's SHA — preferring the
+    `STEP_VERIFIED` record's recorded SHA, falling back to the `STEP_CLAIMED` SHA —
+    against `step_stands_on_nonforgeable_rung` (in ancestry AND a real, non-empty
+    footprint). A forged record pointing at an unrelated empty/foreign commit fails
+    the footprint re-check (an `--allow-empty` forgery touches nothing; a record with
+    no real SHA resolves to nothing) and is absent from the result, so the step is
+    redone. `touched_files`/`is_ancestor` are injectable for tests (no git needed).
+    NOTE on the residual hardening: this re-check confirms the commit is a real
+    artefact in ancestry; a future tightening (the review's strongest suggestion)
+    would also require the footprint to INTERSECT the step's declared file region, so
+    a real-but-unrelated commit can't anchor a step. That needs per-step declared
+    regions the ledger doesn't yet carry; the non-empty-footprint + ancestry re-check
+    already defeats the `--allow-empty` forgery the §5 attack names, and a real commit
+    falsely claimed for a step is still strictly safer than trusting the stored record.
+    """
+    out: set[str] = set()
+    for sid in state.declared_steps:
+        vs = state.verified.get(sid)
+        sha = (vs.sha if vs and vs.sha else state.claimed.get(sid, ""))
+        if not sha:
+            continue
+        region = state.step_regions.get(sid)  # the step's declared file region (or None)
+        if step_stands_on_nonforgeable_rung(
+            sha, root=root, region=region,
+            touched_files=touched_files, is_ancestor=is_ancestor,
+        ):
+            out.add(sid)
+    return frozenset(out)
+def gather_ancestry(
+    state: LedgerState,
+    *,
+    cfg: "_config.SubstrateConfig | None" = None,
+    extra_shas: Iterable[str] = (),
+    lane_advanced_past_resume: bool = False,
+    is_ancestor=None,
+    touched_files=None,
+    head_sha: str = "",
+) -> AncestryFacts:
+    """Freeze the RE-ADJUDICATED ancestry facts `resume_plan` needs (§3.3, §5).
+    The boundary evidence-gather (the `liveness` CLI shape). Two reads, both at this
+    boundary, never inside the pure verdict:
+      1. **Ancestry membership** — collect every SHA the ledger mentions (claimed +
+         verified + start + `extra_shas`) and ask git which are ancestors of HEAD on
+         the served workspace (`_is_ancestor`, explicit root).
+      2. **Step re-adjudication (the §5 fix)** — RE-RUN the non-forgeable footprint
+         check on each declared step (`adjudicate_verified_steps`), so the pure
+         verdict's "done" set comes from a fresh git re-check, NOT from the
+         agent-written `STEP_VERIFIED` record. A forged record is rejected here.
+    `lane_advanced_past_resume` is computed by the CALLER (it knows the lane's tree
+    and the commits since the resume point); the verdict only consumes it.
+    `is_ancestor`/`touched_files` are injectable for tests (the `oracle` injection
+    discipline). The result is handed verbatim to the pure `resume.resume_plan`.
+    """
+    cfg = _config.ensure(cfg)
+    root = cfg.paths.root
+    anc = is_ancestor or (lambda x: _is_ancestor(x, root=root))
+    candidates: set[str] = set()
+    if state.start_sha:
+        candidates.add(state.start_sha)
+    candidates.update(s for s in state.claimed.values() if s)
+    candidates.update(vs.sha for vs in state.verified.values() if vs.sha)
+    candidates.update(s for s in extra_shas if s)
+    in_ancestry = frozenset(s for s in candidates if anc(s))
+    verified_at_read = adjudicate_verified_steps(
+        state, root=root, touched_files=touched_files, is_ancestor=is_ancestor,
+    )
+    return AncestryFacts(
+        shas_in_ancestry=in_ancestry,
+        steps_verified_at_read=verified_at_read,
+        head_sha=head_sha,
+        lane_advanced_past_resume=lane_advanced_past_resume,
+    )

dos/retention.py ADDED Viewed

@@ -0,0 +1,344 @@
+"""The retention policy — how much DOS scratch to keep, *as data*.
+This is the direct answer to the question [`docs/94 §7`](../docs/94_checkpoints-and-recovery-from-slop.md)
+left open and [`docs/106 §3.3`](../docs/106_garbage-collection-and-the-reachability-verdict.md)
+specified: **retention is policy, so it is declared per-workspace and carried on
+the config seam as data** — the `docs/HACKING.md` closed-enum→declared-data
+pattern that already governs `[reasons]` and `[stamp]`.
+Why a seam and not a constant
+=============================
+DOS has the garbage-collection *problem* in two shapes the operator feels (the
+append-only lane journal that grows without bound, and the per-project `.dos/`
+scratch — run-dirs, verdict sidecars, **audit reports** — that nobody auto-reaps).
+docs/106 argues the collector itself is NOT new machinery: `replay`+`compact` is
+already a correct mark-and-copy collector, missing only a *trigger*, a
+*generational split*, and a *safe-point*. The trigger needs a *threshold*, and a
+threshold is a number a host should be able to set (a host on a tiny disk keeps
+little; a host that wants a long forensic tail keeps lots). That number is policy,
+so it rides `SubstrateConfig` next to `.reasons`/`.stamp`/`.overlap_ratio_max`,
+declarable in `dos.toml [retention]`, with a **generic default that is never zero**.
+The floor is NOT these numbers
+==============================
+The load-bearing safety floor (docs/106 §5) is *reachability*, enforced by the
+collector independently of any retention count: **a live lease is never collected,
+ever**, regardless of how small the caps are set. A misconfigured `[retention]`
+may keep *too much* (waste disk) — `False`-keep is tolerable — but it must never
+cause a `False`-collect of state the kernel still needs. So this module carries
+only the *recency / size* knobs; the "never reap a live lease" invariant lives in
+the collector (the journal `compact` fold and the reaper's liveness gate), not
+here. These numbers tune *how aggressively* to collect the already-collectable;
+they cannot loosen *what* is collectable.
+The shape
+=========
+A `RetentionPolicy` is the closed set of size/recency caps, plus one pure
+predicate the kernel exposes for the trigger:
+  * ``should_compact(entries, policy, *, now_ms)`` — `True` when the journal has
+    more than ``journal_max_entries`` lines OR its oldest non-checkpoint entry is
+    older than ``journal_max_age_days``. Reads ONLY the materialized list
+    `read_all` already produced (no extra I/O) — the docs/106 §3.2 threshold,
+    pure, so a driver fires it on a cadence the way `dos watch` fires
+    `liveness.classify`.
+The *reapers* that consume the keep-last-N caps (run-dirs / verdicts / audits)
+live in the helper/driver layer (they do filesystem I/O — `os.scandir`, `unlink`),
+never in this pure leaf; this module only declares the numbers and the one pure
+threshold. That is the same kernel/driver split as `overlap_policy` (the seam is
+data; the scorer that does work is a driver) — I/O at the boundary, data to the
+pure core.
+Two named constants ship in the package:
+  * ``GENERIC_RETENTION`` — the generic default: generous caps, never zero. This
+    is what every workspace gets out of the box (the floor is "never reap a live
+    lease," which the collector enforces independently of these numbers).
+  * ``UNBOUNDED_RETENTION`` — every cap effectively infinite + ``should_compact``
+    always `False`. The opt-out for a host that wants today's keep-everything
+    behaviour explicitly (and the byte-faithful baseline for any consumer built
+    before this seam existed).
+Pure stdlib — no third-party imports, no I/O (the `load_from_toml` half opens the
+toml file at the call boundary, exactly as `stamp.load_from_toml` does, and is the
+only function here that touches the disk). Leaf module: nothing in the kernel
+imports *down* into a driver to use it.
+"""
+from __future__ import annotations
+from dataclasses import dataclass, replace
+from pathlib import Path
+from typing import Any, Mapping
+# A day in milliseconds — the journal `ts` rung and `should_compact` both speak ms
+# (the same unit `journal_delta`/`liveness` use), so the age cap is converted once
+# here rather than scattering `* 86_400_000` at the call sites.
+_MS_PER_DAY = 86_400_000
+# A sentinel "no cap" for the keep-last-N / max-entries knobs. `None` means "keep
+# everything on this axis" — distinct from `0` (which would mean "keep nothing",
+# a foot-gun the floor forbids but the data type should still be able to express
+# for an explicit opt-out). The predicate treats `None` as "this rung never fires."
+NO_CAP: None = None
+@dataclass(frozen=True)
+class RetentionPolicy:
+    """The per-workspace scratch-retention caps, as immutable data.
+    Every field is optional-with-a-default; a host overrides only what it cares
+    about in `dos.toml [retention]`. ``None`` on any cap means "unbounded on this
+    axis" (keep everything) — NOT zero. The caps are size/recency tuning; the
+    "never collect a live lease" floor is the collector's, not this object's.
+      * ``journal_max_entries`` — compact the WAL when it grows past this many
+        lines. ``None`` = never compact by size. (docs/106 §3.2)
+      * ``journal_max_age_days`` — …or when its oldest non-checkpoint entry is
+        older than this. ``None`` = never compact by age. (IDE checkpointers
+        persist ~30d — the docs/94 §7 calibration anchor.)
+      * ``runs_keep_last`` — reap `.dos/runs/` run-dirs beyond the newest N
+        (liveness-gated by the reaper: a live run is kept even if old). ``None`` =
+        keep all run-dirs.
+      * ``verdicts_keep_last`` — reap `.dos/**/.verdict-*.json` beyond the newest
+        N. A verdict is a point-in-time artifact with no liveness, so recency is
+        the honest rule. ``None`` = keep all verdicts.
+      * ``audits_keep_last`` — reap `.dos/audits/trajectory-audit-*` beyond the
+        newest N. The scratch class the 2026-06-03 trajectory audit surfaced (NOT
+        in docs/106 §1.2's original table — the audit's own output is itself an
+        unbounded-growth source). Same recency rule as verdicts. ``None`` = keep
+        all audit reports.
+      * ``projections_compact`` — when ``True``, let `dos reindex` *rewrite* the
+        central `~/.dos` projections to their live digest, not only append/prune.
+        (docs/106 §3.4)
+    """
+    journal_max_entries: int | None = 5000
+    journal_max_age_days: float | None = 30.0
+    runs_keep_last: int | None = 200
+    verdicts_keep_last: int | None = 500
+    audits_keep_last: int | None = 200
+    projections_compact: bool = True
+    def with_overrides(self, **changes: Any) -> "RetentionPolicy":
+        """Return a copy with the named caps replaced (thin `dataclasses.replace`)."""
+        return replace(self, **changes)
+# The generic default — generous, never zero. Every workspace gets this out of the
+# box. The numbers are deliberately provisional (docs/106 §6: "generous-and-
+# provisional, floored on 'never collect a live lease,' with the bench as the
+# eventual evidence source"); the floor that makes them SAFE is the collector's
+# reachability gate, not these values.
+GENERIC_RETENTION = RetentionPolicy()
+# The explicit keep-everything opt-out: every cap unbounded, `should_compact`
+# always False. The byte-faithful "no retention seam" baseline — a consumer that
+# installs this behaves exactly as the kernel did before `[retention]` existed.
+UNBOUNDED_RETENTION = RetentionPolicy(
+    journal_max_entries=NO_CAP,
+    journal_max_age_days=NO_CAP,
+    runs_keep_last=NO_CAP,
+    verdicts_keep_last=NO_CAP,
+    audits_keep_last=NO_CAP,
+    projections_compact=False,
+)
+def should_compact(
+    entries: list[Mapping[str, Any]],
+    policy: RetentionPolicy = GENERIC_RETENTION,
+    *,
+    now_ms: int,
+) -> bool:
+    """The pure auto-compaction threshold (docs/106 §3.2).
+    `True` when the journal is over ``journal_max_entries`` lines OR its oldest
+    non-checkpoint entry is older than ``journal_max_age_days``. Reads ONLY the
+    already-materialized ``entries`` list (the one `lane_journal.read_all`
+    produces) plus the supplied ``now_ms`` clock — no I/O, so a driver fires it on
+    a cadence the way `dos watch` fires `liveness.classify`. The clock is HANDED
+    in (the way a pure verdict is handed a clock), never read here.
+    A cap of ``None`` makes its rung never fire. Both caps ``None`` (or an empty
+    journal) ⇒ `False`. The predicate is monotone in journal size: it can only ask
+    to collect *more* as the log grows, never less — it never blocks a compaction
+    the operator triggers by hand, it only decides when one should fire on its own.
+    Note this is a *should-we* signal, not a *may-we* safety check: the SAFE point
+    to actually run `compact` (the beat-anchor caveat, docs/106 §3.2(ii)) is the
+    collector/driver's concern. A `True` here means "the journal is big/old enough
+    to be worth collecting," not "it is safe to collect this instant."
+    """
+    n = len(entries)
+    if not n:
+        return False
+    max_entries = policy.journal_max_entries
+    if max_entries is not None and n > max_entries:
+        return True
+    max_age_days = policy.journal_max_age_days
+    if max_age_days is not None:
+        oldest = _oldest_non_checkpoint_ms(entries)
+        if oldest is not None and (now_ms - oldest) > max_age_days * _MS_PER_DAY:
+            return True
+    return False
+def plan_reap(
+    entries: list[tuple[str, float]], keep_last: int | None
+) -> list[str]:
+    """The pure keep-last-N reaper plan: which entries to DROP by recency.
+    ``entries`` is ``[(identifier, mtime_seconds), ...]`` — the reaper gathers it
+    at the I/O boundary (`os.scandir`), this function decides. Keeps the ``keep_last``
+    newest by ``mtime`` (ties broken by identifier, descending, so the order is
+    total and deterministic) and returns the identifiers to drop, NEWEST-DROPPED
+    first is NOT guaranteed — the returned list is the drop SET as a list; callers
+    that want a stable display sort it. ``keep_last=None`` (unbounded) ⇒ drop
+    nothing. ``keep_last=0`` ⇒ drop everything (an explicit "keep none"; the
+    collector's reachability floor still spares anything live, but that gate is the
+    I/O reaper's, applied BEFORE this — see `home.reap_scratch`).
+    Pure: no I/O, no clock. This is the recency half of docs/106 §3.4 ("a verdict
+    is a point-in-time artifact with no liveness, so recency is the honest rule"),
+    factored out of the filesystem walk so it is unit-testable in isolation — the
+    same kernel/driver split as `should_compact` (pure threshold) vs the driver
+    that fires `compact`.
+    """
+    if keep_last is None:
+        return []
+    if keep_last <= 0:
+        return [ident for ident, _ in entries]
+    # Newest first: primary key mtime desc, secondary identifier desc (total order).
+    ordered = sorted(entries, key=lambda em: (em[1], em[0]), reverse=True)
+    return [ident for ident, _ in ordered[keep_last:]]
+def _oldest_non_checkpoint_ms(entries: list[Mapping[str, Any]]) -> int | None:
+    """The smallest ``ts`` over non-CHECKPOINT entries, or None if none carry one.
+    Checkpoints are excluded because a CHECKPOINT line is the *snapshot* a prior
+    compaction wrote, not original history — counting its age would make a
+    freshly-compacted journal look stale and re-trigger immediately (a compaction
+    loop). A line with no parseable integer ``ts`` is skipped (the same forgiving
+    posture `journal_delta` takes on a malformed beat) rather than crashing the
+    threshold.
+    """
+    oldest: int | None = None
+    for e in entries:
+        if e.get("op") == "CHECKPOINT":
+            continue
+        ts = e.get("ts")
+        if not isinstance(ts, int):
+            continue
+        if oldest is None or ts < oldest:
+            oldest = ts
+    return oldest
+# ---------------------------------------------------------------------------
+# The `dos.toml [retention]` reader — the data attachment, file I/O at the boundary.
+# Mirrors `stamp.load_from_toml` / `config.load_overlap_from_toml` in shape.
+# ---------------------------------------------------------------------------
+# Retention keys grouped by the kind of value each accepts. The int|None caps and
+# the float|None `journal_max_age_days` are both coerced as caps, but with a
+# different integrality rule; `projections_compact` is a plain bool. Keeping the
+# groups separate lets every field be validated by the rule that fits it.
+_INT_CAP_KEYS = frozenset((
+    "journal_max_entries",
+    "runs_keep_last",
+    "verdicts_keep_last",
+    "audits_keep_last",
+))
+_FLOAT_CAP_KEYS = frozenset(("journal_max_age_days",))
+_BOOL_KEYS = frozenset(("projections_compact",))
+# Every key a `[retention]` table may carry.
+_ALLOWED_KEYS = frozenset().union(_INT_CAP_KEYS, _FLOAT_CAP_KEYS, _BOOL_KEYS)
+def policy_from_table(
+    table: Mapping[str, Any], *, base: RetentionPolicy = GENERIC_RETENTION
+) -> RetentionPolicy:
+    """Derive a `RetentionPolicy` from a parsed `[retention]` table layered on ``base``.
+    Each key present in ``table`` replaces the matching field of ``base``; fields
+    whose key is absent are inherited untouched. The result is a copy produced by
+    `replace`, so ``base`` itself is not modified.
+    Cap keys go through `_coerce_cap` (integral for the int caps, non-integral for
+    the age cap), which is where the ``-1`` / ``"none"`` "unbounded" spellings and
+    the rejection of other negatives are handled. ``0`` passes through as an
+    explicit "keep nothing". The boolean key must be a real ``bool``.
+    Raises `ValueError` when ``table`` is not a mapping, when it carries a key that
+    is not in `_ALLOWED_KEYS` (e.g. the typo ``runs_keep_lsat``), or when a value
+    fails its per-field validation.
+    """
+    if not isinstance(table, Mapping):
+        raise ValueError(f"[retention] must be a table, got {type(table).__name__}")
+    present = set(table)
+    unrecognised = present - _ALLOWED_KEYS
+    if unrecognised:
+        raise ValueError(
+            f"unknown [retention] key(s): {', '.join(sorted(unrecognised))} "
+            f"(allowed: {', '.join(sorted(_ALLOWED_KEYS))})"
+        )
+    # Integer caps first, then the fractional age cap, then the boolean switch.
+    overrides: dict[str, Any] = {
+        name: _coerce_cap(table[name], name, integral=True)
+        for name in _INT_CAP_KEYS & present
+    }
+    overrides.update(
+        (name, _coerce_cap(table[name], name, integral=False))
+        for name in _FLOAT_CAP_KEYS & present
+    )
+    for name in _BOOL_KEYS & present:
+        value = table[name]
+        if not isinstance(value, bool):
+            raise ValueError(f"[retention] {name} must be a boolean, got {value!r}")
+        overrides[name] = value
+    return replace(base, **overrides)
+def _coerce_cap(raw: Any, key: str, *, integral: bool) -> int | float | None:
+    """Coerce one cap value: a number, or the `None`-sentinel spellings.
+    TOML has no null, so ``-1`` and the (case-insensitive) string ``"none"`` both
+    mean "unbounded on this axis" and return ``None``. A non-negative number is
+    taken as the cap; any other negative, or a non-numeric non-``"none"`` value,
+    raises.
+    With ``integral=True`` the cap must be a whole number: ``5`` and ``5.0`` both
+    become ``5``, while a fractional value such as ``1.5`` (or ``inf``) raises
+    instead of being silently truncated. With ``integral=False`` the value is
+    returned as a ``float``. NaN is rejected for either kind, because it compares
+    false against every threshold and would silently disable the cap.
+    ``key`` is used only to name the offending field in the error message.
+    Raises `ValueError` for every rejected value.
+    """
+    if isinstance(raw, str) and raw.strip().lower() == "none":
+        return None
+    # bool is an int subclass, so it must be turned away before the numeric check.
+    if isinstance(raw, bool) or not isinstance(raw, (int, float)):
+        raise ValueError(f"[retention] {key} must be a number or \"none\", got {raw!r}")
+    if raw != raw:  # NaN is the only value unequal to itself
+        raise ValueError(f"[retention] {key} must be a number or \"none\", got {raw!r}")
+    if raw == -1:
+        return None
+    if raw < 0:
+        raise ValueError(
+            f"[retention] {key} must be >= 0 (or -1 / \"none\" for unbounded), got {raw!r}"
+        )
+    if not integral:
+        return float(raw)
+    # float.is_integer() is False for fractional values and for +inf, so both
+    # are rejected here rather than truncated (or raising OverflowError) in int().
+    if isinstance(raw, float) and not raw.is_integer():
+        raise ValueError(
+            f"[retention] {key} must be a whole number "
+            f"(or -1 / \"none\" for unbounded), got {raw!r}"
+        )
+    return int(raw)
+def load_from_toml(
+    path: Path | str, *, base: RetentionPolicy = GENERIC_RETENTION
+) -> RetentionPolicy:
+    """Read the `[retention]` table of a `dos.toml` into a `RetentionPolicy`.
+    ``base`` is returned unchanged when ``path`` does not exist, when neither
+    `tomllib` nor `tomli` can be imported (Python < 3.11 without the backport), or
+    when the parsed file has no non-empty ``retention`` dict. The declarative path
+    is additive: a missing or empty config degrades to ``base`` instead of failing.
+    A non-empty table is handed to `policy_from_table`, so malformed content in it
+    raises from there. Errors from reading or parsing the file itself are not
+    caught here.
+    """
+    toml_path = Path(path)
+    if not toml_path.exists():
+        return base
+    try:
+        import tomllib as toml_reader  # py3.11+
+    except ModuleNotFoundError:  # pragma: no cover - py<3.11 fallback
+        try:
+            import tomli as toml_reader  # type: ignore
+        except ModuleNotFoundError:
+            return base
+    # Decode with `utf-8-sig` so a leading UTF-8 BOM (PowerShell's `utf8` writes
+    # one) is stripped before the TOML parser sees the text.
+    text = toml_path.read_text(encoding="utf-8-sig")
+    section = toml_reader.loads(text).get("retention")
+    if isinstance(section, dict) and section:
+        return policy_from_table(section, base=base)
+    return base