PyPI - dos-kernel - Versions diffs - 0.22.0__py3-none-win_amd64.whl - Mend

dos-kernel 0.22.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (178) hide show

dos/__init__.py +261 -0
dos/_bin/dos-hook.exe +0 -0
dos/_filelock.py +255 -0
dos/_job_policy.py +97 -0
dos/_tree.py +145 -0
dos/admission.py +433 -0
dos/answer_shape.py +299 -0
dos/arbiter.py +859 -0
dos/archive_lock.py +266 -0
dos/arg_provenance.py +814 -0
dos/attest.py +472 -0
dos/breaker.py +311 -0
dos/churn.py +226 -0
dos/claim_extract.py +229 -0
dos/claim_ttl.py +150 -0
dos/cli.py +8721 -0
dos/commit_audit.py +666 -0
dos/completion.py +466 -0
dos/concurrency_class.py +154 -0
dos/config.py +1380 -0
dos/config_lint.py +464 -0
dos/cooldown.py +390 -0
dos/coverage.py +387 -0
dos/dangling_intent.py +287 -0
dos/data_class.py +397 -0
dos/decisions.py +1274 -0
dos/decisions_tui.py +251 -0
dos/dispatch_top.py +740 -0
dos/dispatch_top_tui.py +116 -0
dos/drivers/__init__.py +40 -0
dos/drivers/ci_status.py +630 -0
dos/drivers/citation_resolve.py +703 -0
dos/drivers/decision_stop.py +98 -0
dos/drivers/export_file.py +173 -0
dos/drivers/export_otlp.py +275 -0
dos/drivers/export_statsd.py +242 -0
dos/drivers/hook_dialects.py +391 -0
dos/drivers/job.py +47 -0
dos/drivers/llm_judge.py +360 -0
dos/drivers/memory_recall.py +1231 -0
dos/drivers/notify_slack.py +373 -0
dos/drivers/notify_webhook.py +251 -0
dos/drivers/operator_judge.py +114 -0
dos/drivers/os_acceptance.py +228 -0
dos/drivers/paste_log.py +132 -0
dos/drivers/plan_scope.py +133 -0
dos/drivers/self_improve.py +375 -0
dos/drivers/similarity_judge.py +249 -0
dos/drivers/state_diff.py +274 -0
dos/drivers/supervisor.py +347 -0
dos/drivers/watchdog.py +363 -0
dos/drivers/workshop.py +160 -0
dos/durable_schema.py +344 -0
dos/effect_witness.py +393 -0
dos/efficiency.py +318 -0
dos/enforce.py +414 -0
dos/enumerate.py +776 -0
dos/env_print.py +378 -0
dos/event_severity.py +258 -0
dos/evidence.py +692 -0
dos/exec_capability.py +256 -0
dos/export_cursor.py +143 -0
dos/exporter.py +320 -0
dos/firing_label.py +353 -0
dos/fleet_roll.py +226 -0
dos/gate_classify.py +827 -0
dos/gh4_coverage.py +179 -0
dos/git_delta.py +122 -0
dos/guard.py +215 -0
dos/health.py +552 -0
dos/help_summary.py +519 -0
dos/home.py +934 -0
dos/hook_binary.py +194 -0
dos/hook_dialect.py +271 -0
dos/hook_exit.py +191 -0
dos/hook_install.py +437 -0
dos/id_alloc.py +304 -0
dos/improve.py +499 -0
dos/intent_ledger.py +635 -0
dos/interpret.py +176 -0
dos/intervention.py +769 -0
dos/intervention_eval.py +371 -0
dos/journal_delta.py +308 -0
dos/judge_eval.py +328 -0
dos/judges.py +366 -0
dos/lane_infer.py +127 -0
dos/lane_journal.py +1001 -0
dos/lane_lease.py +952 -0
dos/lane_overlap.py +228 -0
dos/lease_health.py +282 -0
dos/lifecycle.py +211 -0
dos/liveness.py +352 -0
dos/lock_modes.py +185 -0
dos/log_source.py +395 -0
dos/loop_decide.py +1746 -0
dos/marker_gate.py +254 -0
dos/marker_sensor.py +396 -0
dos/noop_streak.py +280 -0
dos/notify.py +479 -0
dos/observe.py +175 -0
dos/oracle.py +1661 -0
dos/overlap_eval.py +214 -0
dos/overlap_policy.py +342 -0
dos/packet_sidecar.py +267 -0
dos/phase_shipped.py +1985 -0
dos/pick_priority.py +225 -0
dos/pickable.py +369 -0
dos/picker_oracle.py +1037 -0
dos/plan_board.py +513 -0
dos/plan_board_tui.py +113 -0
dos/plan_source.py +455 -0
dos/posttool_sensor.py +528 -0
dos/precursor_gate.py +499 -0
dos/precursor_gate_eval.py +239 -0
dos/preflight.py +825 -0
dos/pretool_sensor.py +490 -0
dos/proc_delta.py +181 -0
dos/productivity.py +296 -0
dos/provider_limit.py +242 -0
dos/py.typed +4 -0
dos/reason_morphology.py +299 -0
dos/reasons.py +449 -0
dos/reconcile.py +173 -0
dos/recurring_wedge.py +206 -0
dos/render.py +393 -0
dos/result_state.py +468 -0
dos/resume.py +578 -0
dos/resume_evidence.py +293 -0
dos/retention.py +344 -0
dos/reward.py +372 -0
dos/rewind.py +587 -0
dos/rewind_evidence.py +168 -0
dos/rewind_tokens.py +252 -0
dos/run_id.py +342 -0
dos/scope.py +520 -0
dos/scope_source.py +382 -0
dos/scout.py +982 -0
dos/self_modify.py +209 -0
dos/sibling_scan.py +569 -0
dos/skills/EXAMPLES.md +584 -0
dos/skills/dos-class-cycle/SKILL.md +107 -0
dos/skills/dos-dispatch/SKILL.md +177 -0
dos/skills/dos-dispatch-loop/SKILL.md +254 -0
dos/skills/dos-goal-gate/SKILL.md +269 -0
dos/skills/dos-next-up/SKILL.md +231 -0
dos/skills/dos-promote/SKILL.md +114 -0
dos/skills/dos-replan/SKILL.md +159 -0
dos/skills/dos-replan-loop/SKILL.md +114 -0
dos/skills/dos-self-improve/SKILL.md +213 -0
dos/skills/dos-supervise-loop/SKILL.md +180 -0
dos/skills/dos-unstick/SKILL.md +108 -0
dos/skills/dos-witness-claim/SKILL.md +251 -0
dos/stamp.py +1002 -0
dos/state_health.py +387 -0
dos/status.py +114 -0
dos/stop_policy.py +334 -0
dos/supervise.py +1014 -0
dos/testwitness.py +392 -0
dos/timeline.py +1027 -0
dos/tokens.py +485 -0
dos/tool_stream.py +393 -0
dos/tool_stream_eval.py +226 -0
dos/trace.py +524 -0
dos/verdict.py +140 -0
dos/verdict_cli.py +189 -0
dos/verdict_journal.py +497 -0
dos/verdict_rollup.py +217 -0
dos/verdicts.py +181 -0
dos/wedge_reason.py +282 -0
dos_kernel-0.22.0.dist-info/METADATA +859 -0
dos_kernel-0.22.0.dist-info/RECORD +178 -0
dos_kernel-0.22.0.dist-info/WHEEL +5 -0
dos_kernel-0.22.0.dist-info/entry_points.txt +39 -0
dos_kernel-0.22.0.dist-info/licenses/LICENSE +21 -0
dos_kernel-0.22.0.dist-info/top_level.txt +2 -0
dos_mcp/__init__.py +52 -0
dos_mcp/py.typed +2 -0
dos_mcp/server.py +779 -0

dos/noop_streak.py ADDED Viewed

@@ -0,0 +1,280 @@
+"""NOS — the no-op-streak verdict: *how many turns in a row produced zero ground-truth delta?*
+docs/259 §Follow-up 1 — the **generalization of the wait-marker budget** off its one
+special case ("markers emitted") onto the general one ("no-op turns since the last
+forward delta"). `loop_decide.wait_marker_budget` already answers a count-vs-cap
+question for ONE flavor of no-op turn: a `claude -p` keep-alive marker — a full
+assistant turn that replays the whole context out of cache and produces nothing but
+"still waiting." But a `ScheduleWakeup`-poll loop that re-reads a `.output` file in a
+tight tick, or any loop that wakes, finds no change, and goes back to sleep, is the
+*same* pathology: a turn that paid the cache-replay cost and moved no ground truth.
+This module is the verdict that makes those one verdict — "the run has taken N no-op
+turns since it last made a forward delta; has it spent its budget?"
+This is `wait_marker_budget`'s **generalization**, and it sits in the temporal-verdict
+family (`liveness` / `tool_stream` / `productivity` / **`noop_streak`**) — the same
+pure-verdict shape, re-aimed once more:
+    liveness.classify     (ProgressEvidence, policy)  -> LivenessVerdict   (did state move AT ALL?)
+    tool_stream.classify_stream (ToolStream, policy)  -> StreamVerdict     (is the tool stream repeating?)
+    productivity.classify  (WorkHistory, policy)       -> ProductivityVerdict (is the work-RATE fading?)
+    noop_streak.classify   (NoOpHistory, policy)       -> NoOpStreakVerdict (how many no-op turns since a forward delta?)
+                           ^ THIS module
+It is a COUNT-vs-cap verdict, not a TREND verdict — which is why it is `wait_marker_budget`'s
+sibling and NOT a second mode of `productivity`. `productivity` reads a *vector* of
+per-step work magnitudes and asks "is the rate falling" (`deltas[-1]`/`deltas[-2]`);
+`noop_streak` reads a *single* monotone counter — the run-length of consecutive
+no-op turns since the last forward delta — and asks "is that run-length past its
+budget." Folding the streak into `productivity.WorkHistory` would overload its
+well-defined "fading rate" semantics with a different question and collide its
+"withhold the accusation / reject negatives" floor with this guard's opposite
+conservative direction (below). So the streak gets its own small verdict, the way
+`productivity` got its own rather than living inside `liveness`.
+**The forward-delta reset is the load-bearing idea** (docs/259 §Follow-up 2). The
+count is not "no-op turns ever" — it is "no-op turns *since the last forward delta*."
+A forward delta (a commit, a real tool result, a host re-entering a fresh wait phase)
+ZEROES the streak, the `tool_stream` ADVANCING analogue: progress earns the loop a
+fresh budget. Without a reset the count is a strict lifetime monotone (what
+`wait_marker_budget` is today); with one, a long-lived session that legitimately
+makes progress and then re-enters a wait phase starts fresh instead of being refused
+on a stale tally. The reset lives at the BOUNDARY (`marker_sensor.record_reset`
+appends an `op:"RESET"` record; the replayed count is markers-after-the-last-reset);
+this pure verdict just reads the resulting count.
+**Byte-clean by construction.** A no-op turn is a turn the *runtime* observed to
+produce zero ground-truth delta — it is counted by the durable accumulator
+(`marker_sensor`), never threaded through the agent's own narration. So EXHAUSTED is
+"the environment recorded N no-op turns since the last forward delta," never "the
+agent says it has waited long enough" — a quantity, not a self-report (the docs/138
+invariant `liveness`/`productivity`/`tool_stream` all keep).
+**Advisory.** Like `wait_marker_budget` and `liveness.SPINNING`, EXHAUSTED REPORTS;
+it never kills a process. A loop consults it and chooses to stop holding its turn
+open (the marker hook is the first consumer — it blocks the Stop while the budget is
+LIVE, allows the Stop once EXHAUSTED); nothing here enforces.
+**The conservative direction is the OPPOSITE of `productivity`'s** — and that is why
+it is a separate verdict. `productivity` withholds the DIMINISHING accusation when in
+doubt (a missing delta is "still productive"). A *cost* guard must do the reverse:
+when in doubt, count the no-op turn (so the guard refuses one *more* keep-alive turn,
+never one *fewer*) — over-spending on a missed count is the failure to avoid. The
+accumulator honors this by leaving a torn/unreadable RESET as "the reset didn't
+happen" (the count stays HIGHER → EXHAUSTED sooner → refuse more); this verdict
+honors it by treating `noop_turns >= max_streak` as EXHAUSTED (the `>=`, not `>`, so
+the budget is spent the instant it is reached). Refusing one no-op turn too early
+costs at most one missed poll; the real Bash `<task-notification>` (which fires on
+the child's true exit regardless) is the safety net.
+**No-telemetry / no-plan discipline** (the `test_verify_no_plan` sibling): NOS needs
+*nothing* but the no-op-turn count the caller already replayed. No plan, no registry,
+no clock — `classify()` performs no I/O at all (it is timeless, like `productivity`; it
+reads a count, not an age). A caller with a count gets a verdict; a caller with 0 gets
+the honest LIVE floor (a fresh wait phase has spent nothing yet).
+"""
+from __future__ import annotations
+import enum
+from dataclasses import dataclass
+from pathlib import Path
+class NoOpStreak(str, enum.Enum):
+    """The typed no-op-streak verdict — two states, mutually exclusive.
+    `str`-valued so it round-trips through a CLI stdout token / exit-code map without
+    a lookup table (mirrors `liveness.Liveness` / `productivity.Productivity` /
+    `gate_classify.Verdict`).
+    """
+    LIVE = "LIVE"            # the streak is under the cap — another no-op turn is permitted
+    EXHAUSTED = "EXHAUSTED"  # the streak has reached the cap — refuse further no-op turns
+    def __str__(self) -> str:  # pragma: no cover - trivial
+        return self.value
+@dataclass(frozen=True)
+class NoOpStreakPolicy:
+    """The cap that separates LIVE / EXHAUSTED — policy, not mechanism.
+    The same "mechanism is kernel, threshold is config" split as `productivity`'s
+    floor and `loop_decide`'s `max_iterations`. The default is GENERIC and equals
+    `wait_marker_budget`'s default (4) — so the generalized verdict refuses at the
+    same budget the shipped marker lever does (the marker case is the special case,
+    and it must not drift). A workspace declares its own in `dos.toml [noop_streak]`,
+    the closed-config-as-data pattern (`[tool_stream]` / `[productivity]` / `[stamp]`).
+      max_streak — the **no-op-turn budget since the last forward delta**: the most
+                   consecutive zero-delta turns a loop may take before the verdict
+                   refuses the next one. `wait_marker_budget`'s `max_markers`,
+                   generalized off "markers" onto "no-op turns." A streak that REACHES
+                   this cap (`>=`, the cost-guard direction) is EXHAUSTED.
+    Default: 4 — `wait_marker_budget`'s per-run cap, one below the `keepalive_poll`
+    telemetry flag (>=5), so the runtime refusal lands one turn before the post-hoc
+    alarm would fire.
+    """
+    max_streak: int = 4
+    def __post_init__(self) -> None:
+        if self.max_streak < 0:
+            raise ValueError("max_streak must be non-negative")
+# Shared generic policy (max_streak=4): the default `policy` argument of `classify()`,
+# the fallback used by `policy_from_table()`, and the default `base` of `load_from_toml()`.
+DEFAULT_POLICY = NoOpStreakPolicy()
+@dataclass(frozen=True)
+class NoOpHistory:
+    """The no-op-turn count `classify()` reads — gathered by the CALLER at the boundary.
+    No clock, no I/O inside the verdict — the arbiter rule, sharpened: NOS is
+    *timeless* (it reads a count, never an age). The caller's boundary
+    (`marker_sensor.marker_count`, which replays the session's `.dos/markers/<sid>.jsonl`
+    tally into markers-since-the-last-RESET) measures the streak and freezes it here.
+      noop_turns — the count of no-op turns SINCE the last forward-delta reset. A
+                   no-op turn is a turn the runtime observed to produce zero ground-truth
+                   delta (today: one keep-alive wait-marker; the generalization also
+                   admits a poll-tick that found no change). 0 is "a fresh wait phase,
+                   nothing spent yet" — the LIVE floor. Negative is rejected: a streak
+                   length is a non-negative count.
+    The single load-bearing read is `noop_turns` vs the policy's `max_streak` — the
+    same count-vs-cap `wait_marker_budget(markers_emitted, max_markers)` makes. The
+    count is carried (not just a bool) so `--output json` can echo it and the verdict
+    can hand back the incremented value to carry into the next decision.
+    """
+    noop_turns: int = 0
+    def __post_init__(self) -> None:
+        if self.noop_turns < 0:
+            raise ValueError("noop_turns must be non-negative (a count of no-op turns)")
+    @classmethod
+    def of(cls, noop_turns: int) -> "NoOpHistory":
+        """Build a history from a replayed no-op-turn count."""
+        return cls(noop_turns)
+@dataclass(frozen=True)
+class NoOpStreakVerdict:
+    """The single verdict `classify()` returns, with the count echoed back.
+    `verdict` is the typed `NoOpStreak`. `allow` is the convenience bit the marker
+    hook keys on (`allow == (verdict is NoOpStreak.LIVE)`): True to permit one more
+    no-op turn, False to refuse it. `noop_turns` is the count to carry into the *next*
+    decision — incremented when allowed (this no-op turn now happened), unchanged when
+    refused (the refused turn did not happen) — byte-mirroring
+    `WaitMarkerDecision.markers_emitted`. `reason` is operator-facing. `to_dict` is the
+    json shape (the legible-distrust renderer seam: the operator sees not just
+    EXHAUSTED but the count and cap behind it).
+    """
+    verdict: NoOpStreak
+    allow: bool
+    noop_turns: int
+    reason: str
+    def to_dict(self) -> dict:
+        return {
+            "verdict": self.verdict.value,
+            "allow": self.allow,
+            "noop_turns": self.noop_turns,
+            "reason": self.reason,
+        }
+def classify(
+    history: NoOpHistory, policy: NoOpStreakPolicy = DEFAULT_POLICY
+) -> NoOpStreakVerdict:
+    """Classify a run's no-op streak against its budget. PURE — no I/O.
+    The `wait_marker_budget` arithmetic, generalized: a count vs a cap, with the
+    cost-guard `>=` (the budget is spent the instant it is reached, not one past).
+      * EXHAUSTED (refuse) — `noop_turns >= max_streak`: the run has taken its whole
+        budget of no-op turns since the last forward delta. The next one would replay
+        full context out of cache for no work; refuse it (the loop ends its turn and
+        waits on the real completion signal). The count carried forward is UNCHANGED
+        (a refused turn did not happen).
+      * LIVE (allow) — `noop_turns < max_streak`: budget remains; permit one more no-op
+        turn and carry `noop_turns + 1` (this turn now happened) into the next decision.
+    A `max_streak == 0` policy refuses the FIRST no-op turn (`0 >= 0`) — the degenerate
+    `wait_marker_budget(0, 0)` preserves, and the honest reading of "no budget at all."
+    """
+    if history.noop_turns >= policy.max_streak:
+        return NoOpStreakVerdict(
+            verdict=NoOpStreak.EXHAUSTED,
+            allow=False,
+            noop_turns=history.noop_turns,
+            reason=(
+                f"no-op streak budget exhausted "
+                f"({history.noop_turns}/{policy.max_streak} no-op turns since the last "
+                f"forward delta) — each further turn replays full context out of cache "
+                f"for no work; wait on the real completion signal, a forward delta resets "
+                f"the streak"
+            ),
+        )
+    return NoOpStreakVerdict(
+        verdict=NoOpStreak.LIVE,
+        allow=True,
+        noop_turns=history.noop_turns + 1,
+        reason=(
+            f"no-op streak {history.noop_turns + 1}/{policy.max_streak} since the last "
+            f"forward delta — budget remains"
+        ),
+    )
+# ---------------------------------------------------------------------------
+# The declarative on-ramp — read a policy out of dos.toml (mirror tool_stream/productivity).
+# ---------------------------------------------------------------------------
+def policy_from_table(table: dict) -> NoOpStreakPolicy:
+    """Turn a parsed `[noop_streak]` TOML table into a `NoOpStreakPolicy`. PURE (no I/O).
+    `table` is `{max_streak?}` — the shape `tomllib.load(...)["noop_streak"]` yields. A
+    missing key falls back to the generic default; a malformed value raises (via
+    `NoOpStreakPolicy.__post_init__`), so a bad declaration fails loudly at load (the
+    `tool_stream.policy_from_table` posture).
+    """
+    if not table:
+        return DEFAULT_POLICY
+    return NoOpStreakPolicy(
+        max_streak=int(table.get("max_streak", DEFAULT_POLICY.max_streak)),
+    )
+def load_from_toml(
+    path: "Path | str", *, base: NoOpStreakPolicy = DEFAULT_POLICY
+) -> NoOpStreakPolicy:
+    """Build a `NoOpStreakPolicy` from a `dos.toml`'s `[noop_streak]` table.
+    Returns `base` unchanged when the file is absent, has no `[noop_streak]` table, or
+    `tomllib` is unavailable — the declarative path is purely additive, so a missing/empty
+    config degrades to the generic default, never an error (the `tool_stream.load_from_toml`
+    contract). A *present but malformed* table raises (`NoOpStreakPolicy.__post_init__`).
+    Reads with `utf-8-sig` to strip a PowerShell-written BOM (the
+    `reasons`/`intervention`/`tool_stream` `load_from_toml` fix).
+    """
+    p = Path(path)
+    if not p.exists():
+        return base
+    try:
+        import tomllib  # py3.11+
+    except ModuleNotFoundError:  # pragma: no cover - py<3.11 fallback
+        try:
+            import tomli as tomllib  # type: ignore
+        except ModuleNotFoundError:
+            return base
+    data = tomllib.loads(p.read_text(encoding="utf-8-sig"))
+    table = data.get("noop_streak")
+    if not isinstance(table, dict) or not table:
+        return base
+    return policy_from_table(table)