RubyGems - rubino-agent - Versions diffs - 0.3.0 → 0.5.0 - Mend

rubino-agent 0.3.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

checksums.yaml +4 -4
data/.rubocop_todo.yml +11 -2
data/AGENTS.md +1 -1
data/CHANGELOG.md +172 -5
data/CONTRIBUTING.md +10 -1
data/README.md +14 -5
data/Rakefile +31 -0
data/docs/agents.md +42 -23
data/docs/architecture.md +2 -2
data/docs/commands.md +35 -3
data/docs/configuration.md +20 -23
data/docs/getting-started.md +5 -3
data/docs/security.md +16 -5
data/docs/skills.md +31 -0
data/docs/troubleshooting.md +1 -1
data/exe/rubino +16 -2
data/install.sh +721 -59
data/lib/rubino/active_agent.rb +73 -0
data/lib/rubino/agent/action_claim_guard.rb +881 -0
data/lib/rubino/agent/agent_registry.rb +5 -2
data/lib/rubino/agent/definition.rb +1 -9
data/lib/rubino/agent/fallback_chain.rb +0 -6
data/lib/rubino/agent/iteration_budget.rb +109 -3
data/lib/rubino/agent/loop.rb +476 -20
data/lib/rubino/agent/model_call_runner.rb +81 -3
data/lib/rubino/agent/prompts/build.txt +22 -5
data/lib/rubino/agent/response_validator.rb +8 -0
data/lib/rubino/agent/runner.rb +133 -8
data/lib/rubino/agent/tool_executor.rb +166 -14
data/lib/rubino/agent/truncation_continuation.rb +4 -1
data/lib/rubino/api/server.rb +19 -0
data/lib/rubino/attachments/classify.rb +35 -17
data/lib/rubino/boot/config_guard.rb +71 -0
data/lib/rubino/cli/chat/completion_builder.rb +42 -6
data/lib/rubino/cli/chat/idle_card_host.rb +7 -1
data/lib/rubino/cli/chat/session_resolver.rb +87 -21
data/lib/rubino/cli/chat_command.rb +1189 -50
data/lib/rubino/cli/commands.rb +282 -2
data/lib/rubino/cli/config_command.rb +68 -8
data/lib/rubino/cli/doctor_command.rb +204 -12
data/lib/rubino/cli/jobs_command.rb +12 -0
data/lib/rubino/cli/memory_command.rb +53 -20
data/lib/rubino/cli/onboarding_wizard.rb +79 -6
data/lib/rubino/cli/session_command.rb +172 -18
data/lib/rubino/cli/setup_command.rb +131 -8
data/lib/rubino/cli/skills_command.rb +183 -9
data/lib/rubino/cli/trust_gate.rb +16 -7
data/lib/rubino/commands/built_ins.rb +2 -0
data/lib/rubino/commands/command.rb +12 -2
data/lib/rubino/commands/executor.rb +149 -12
data/lib/rubino/commands/handlers/agent_switch.rb +100 -0
data/lib/rubino/commands/handlers/agents.rb +156 -41
data/lib/rubino/commands/handlers/config.rb +4 -1
data/lib/rubino/commands/handlers/help.rb +113 -14
data/lib/rubino/commands/handlers/memory.rb +15 -5
data/lib/rubino/commands/handlers/sessions.rb +26 -3
data/lib/rubino/commands/handlers/status.rb +9 -4
data/lib/rubino/commands/loader.rb +12 -0
data/lib/rubino/config/configuration.rb +86 -24
data/lib/rubino/config/defaults.rb +140 -33
data/lib/rubino/config/loader.rb +62 -12
data/lib/rubino/config/validator.rb +341 -0
data/lib/rubino/config/writer.rb +123 -31
data/lib/rubino/context/compressor.rb +184 -22
data/lib/rubino/context/environment_inspector.rb +2 -2
data/lib/rubino/context/file_discovery.rb +2 -2
data/lib/rubino/context/message_boundary.rb +27 -1
data/lib/rubino/context/project_languages.rb +90 -0
data/lib/rubino/context/prompt_assembler.rb +105 -22
data/lib/rubino/context/summary_builder.rb +45 -4
data/lib/rubino/context/token_budget.rb +36 -11
data/lib/rubino/context/token_estimate.rb +45 -0
data/lib/rubino/context/tool_result_pruner.rb +81 -0
data/lib/rubino/database/connection.rb +154 -3
data/lib/rubino/database/migrations/001_create_initial_schema.rb +314 -40
data/lib/rubino/database/migrator.rb +98 -5
data/lib/rubino/documents/cap_exceeded.rb +13 -0
data/lib/rubino/documents/converters/csv.rb +4 -3
data/lib/rubino/documents/converters/docx.rb +29 -5
data/lib/rubino/documents/converters/html.rb +5 -1
data/lib/rubino/documents/converters/json.rb +2 -1
data/lib/rubino/documents/converters/pdf.rb +11 -2
data/lib/rubino/documents/converters/plain.rb +2 -1
data/lib/rubino/documents/converters/pptx.rb +11 -2
data/lib/rubino/documents/converters/xlsx.rb +35 -4
data/lib/rubino/documents/converters/xml.rb +2 -1
data/lib/rubino/documents/limits.rb +210 -0
data/lib/rubino/documents.rb +10 -3
data/lib/rubino/errors.rb +36 -5
data/lib/rubino/interaction/cancel_token.rb +19 -3
data/lib/rubino/interaction/events.rb +13 -0
data/lib/rubino/interaction/lifecycle.rb +99 -13
data/lib/rubino/interaction/polishing.rb +176 -0
data/lib/rubino/jobs/cron_job_repository.rb +5 -8
data/lib/rubino/jobs/handlers/cleanup_sessions_job.rb +11 -0
data/lib/rubino/jobs/handlers/distill_skill_job.rb +65 -9
data/lib/rubino/jobs/queue.rb +63 -8
data/lib/rubino/jobs/runner.rb +24 -6
data/lib/rubino/jobs/worker.rb +0 -4
data/lib/rubino/llm/adapter_response.rb +47 -4
data/lib/rubino/llm/credential_check.rb +15 -16
data/lib/rubino/llm/error_classifier.rb +89 -1
data/lib/rubino/llm/inline_think_filter.rb +69 -12
data/lib/rubino/llm/request.rb +30 -3
data/lib/rubino/llm/ruby_llm_adapter.rb +394 -46
data/lib/rubino/llm/tool_bridge.rb +113 -9
data/lib/rubino/mcp/manager.rb +18 -1
data/lib/rubino/mcp/mcp_tool_wrapper.rb +14 -3
data/lib/rubino/memory/aux_retry.rb +107 -0
data/lib/rubino/memory/backends/sqlite.rb +73 -44
data/lib/rubino/memory/backends.rb +23 -7
data/lib/rubino/memory/salience_gate.rb +103 -0
data/lib/rubino/memory/sqlite_extraction.rb +70 -0
data/lib/rubino/memory/sqlite_extraction_prompt.rb +11 -0
data/lib/rubino/memory/store.rb +33 -5
data/lib/rubino/memory/threat_scanner.rb +52 -0
data/lib/rubino/output/cost.rb +52 -0
data/lib/rubino/output/headless_block_latch.rb +53 -0
data/lib/rubino/output/result_serializer.rb +222 -0
data/lib/rubino/output/turn_recorder.rb +77 -0
data/lib/rubino/security/approval_policy.rb +227 -32
data/lib/rubino/security/command_allowlist.rb +79 -4
data/lib/rubino/security/doom_loop_detector.rb +21 -2
data/lib/rubino/security/hardline_guard.rb +189 -16
data/lib/rubino/security/pattern_matcher.rb +28 -5
data/lib/rubino/security/prefix_deriver.rb +25 -6
data/lib/rubino/security/readonly_commands.rb +145 -5
data/lib/rubino/security/secret_path.rb +134 -0
data/lib/rubino/security/url_safety.rb +255 -0
data/lib/rubino/session/repository.rb +212 -11
data/lib/rubino/session/store.rb +139 -14
data/lib/rubino/skills/installer.rb +230 -0
data/lib/rubino/skills/prompt_index.rb +2 -2
data/lib/rubino/skills/registry.rb +52 -1
data/lib/rubino/skills/skill.rb +64 -3
data/lib/rubino/skills/skill_tool.rb +16 -5
data/lib/rubino/tools/background_tasks.rb +157 -13
data/lib/rubino/tools/base.rb +204 -3
data/lib/rubino/tools/edit_tool.rb +73 -18
data/lib/rubino/tools/glob_tool.rb +48 -9
data/lib/rubino/tools/grep_tool.rb +103 -9
data/lib/rubino/tools/multi_edit_tool.rb +64 -9
data/lib/rubino/tools/patch_tool.rb +5 -0
data/lib/rubino/tools/read_attachment_tool.rb +3 -1
data/lib/rubino/tools/read_tool.rb +33 -15
data/lib/rubino/tools/read_tracker.rb +153 -35
data/lib/rubino/tools/registry.rb +113 -12
data/lib/rubino/tools/result.rb +9 -1
data/lib/rubino/tools/ruby_tool.rb +0 -0
data/lib/rubino/tools/shell_registry.rb +70 -0
data/lib/rubino/tools/shell_tool.rb +40 -1
data/lib/rubino/tools/summarize_file_tool.rb +6 -0
data/lib/rubino/tools/task_stop_tool.rb +10 -16
data/lib/rubino/tools/task_tool.rb +36 -8
data/lib/rubino/tools/vision_tool.rb +5 -0
data/lib/rubino/tools/webfetch_tool.rb +39 -7
data/lib/rubino/tools/websearch_tool.rb +92 -30
data/lib/rubino/tools/write_tool.rb +23 -4
data/lib/rubino/ui/api.rb +10 -1
data/lib/rubino/ui/base.rb +11 -0
data/lib/rubino/ui/bottom_composer.rb +382 -74
data/lib/rubino/ui/cli.rb +515 -83
data/lib/rubino/ui/completion_menu.rb +11 -7
data/lib/rubino/ui/headless_trace.rb +63 -0
data/lib/rubino/ui/live_region.rb +70 -7
data/lib/rubino/ui/markdown_renderer.rb +142 -7
data/lib/rubino/ui/notifier.rb +0 -2
data/lib/rubino/ui/null.rb +52 -5
data/lib/rubino/ui/paste_store.rb +16 -2
data/lib/rubino/ui/queued_indicators.rb +6 -1
data/lib/rubino/ui/status_bar.rb +61 -7
data/lib/rubino/ui/streaming_markdown.rb +59 -6
data/lib/rubino/ui/subagent_view.rb +29 -4
data/lib/rubino/ui/tool_label.rb +52 -0
data/lib/rubino/update_check.rb +39 -4
data/lib/rubino/util/atomic_file.rb +117 -0
data/lib/rubino/util/ignore_rules.rb +120 -0
data/lib/rubino/util/output.rb +229 -12
data/lib/rubino/util/secrets_mask.rb +70 -7
data/lib/rubino/util/spill_store.rb +153 -0
data/lib/rubino/version.rb +1 -1
data/lib/rubino/workspace.rb +9 -1
data/lib/rubino.rb +191 -7
data/rubino-agent.gemspec +1 -0
data/skills/ruby-expert/SKILL.md +1 -0
metadata +42 -12
data/lib/rubino/agent/router.rb +0 -65
data/lib/rubino/database/migrations/002_create_runs.rb +0 -45
data/lib/rubino/database/migrations/003_create_skill_states.rb +0 -15
data/lib/rubino/database/migrations/004_create_cron_jobs.rb +0 -36
data/lib/rubino/database/migrations/005_create_oauth_connections.rb +0 -27
data/lib/rubino/database/migrations/006_create_webhook_deliveries.rb +0 -34
data/lib/rubino/database/migrations/007_create_messages_fts.rb +0 -59
data/lib/rubino/database/migrations/008_create_memory_facts.rb +0 -75
data/lib/rubino/database/migrations/009_create_memory_graph.rb +0 -55
data/lib/rubino/database/migrations/010_add_owner_pid_to_sessions.rb +0 -20

data/lib/rubino/agent/action_claim_guard.rb ADDED Viewed

@@ -0,0 +1,881 @@
+# frozen_string_literal: true
+module Rubino
+  module Agent
+    # Closes the #1 trust-killer: the model ENDS a turn asserting it did or will
+    # do something ("Running the tests now", "Saved the file", "Changed
+    # directory") with ZERO tool calls, so a fabricated success reaches the user.
+    #
+    # The structured tool-call channel is the ONLY thing that advances state. A
+    # text-only turn whose prose claims an action against a tool rubino exposes
+    # is, by construction, a claim with nothing behind it. We do not trust it.
+    #
+    # Two intents, two outcomes:
+    #
+    #   1. cd / "change directory" — rubino has NO cd tool, so the claim can NEVER
+    #      be true. We do not reflect (a reflection would just invite the model to
+    #      claim it again); we REWRITE the final answer with an honest message
+    #      explaining how to actually change the workspace (/add-dir or relaunch).
+    #
+    #   2. any other action verb (run/test/save/write/edit/create/delete/move…)
+    #      mapped to a tool rubino DOES expose — we REFLECT one corrective turn
+    #      ("you said you would <X> but issued no tool call; call the tool now or
+    #      say you cannot and why"), capped at MAX_REFLECTIONS (aider's
+    #      reflected_message pattern, capped). After the cap the guard becomes
+    #      BINDING: it REPLACES the fabricated final answer with a deterministic
+    #      honest message rather than letting the model's "done" reach the user
+    #      (G1). The structured tool-call channel is the only thing that advances
+    #      state, so a terminal turn that still asserts a mutation with zero tool
+    #      calls has, by construction, changed nothing — and we say exactly that.
+    #
+    #   3. a tool was DENIED or BLOCKED this turn (user-denied, or headless
+    #      fail-closed "needs approval but no interactive session"), and the model
+    #      then narrates success OR hands back a fabricated unified diff/patch for
+    #      files it never wrote (F1/F2). The action did NOT happen, so the diff is
+    #      not a real artifact; we REPLACE the answer with the honest "that was
+    #      blocked — nothing was applied; pass --yolo (or approve interactively)"
+    #      so a plausible-looking but partly-invented diff can never stand as if
+    #      real and get `git apply`-ed.
+    #
+    #   4. the INVERSE (#381, PESSIMISTIC fabrication): a turn that ACTUALLY ran
+    #      tools (often a budget/rate-limit exhausted turn whose forced summary the
+    #      model writes pessimistically) ends with a confident claim that NOTHING
+    #      happened — "I have not read a single file, not run grep, not made any
+    #      edits" — even though the ledger shows N tool calls and real edits on
+    #      disk. Letting that stand makes a developer believe no work was done and
+    #      miss correct, uncommitted changes. The harness — not the narration — is
+    #      the authority on side-effects (the same principle as 1–3, mirrored): when
+    #      the final answer asserts no/zero actions yet the tool-call ledger shows
+    #      tools DID run, we RECONCILE it with a truthful harness note ("N tool
+    #      calls ran this turn (M edits — review uncommitted changes)"). This path
+    #      is the ONLY one that fires when tool_count > 0; it keys on the ledger, not
+    #      on exact wording, so it stays model-agnostic.
+    #
+    # Deliberately conservative — it must never nag a legitimate text answer:
+    #   * Only fires when the WHOLE turn ran zero tools AND zero denied tools.
+    #     A turn that ran (or had denied) any tool is the model acting/recovering,
+    #     not fabricating; its closing prose is a real summary.
+    #   * The verb must be asserted as the assistant's OWN action in the
+    #     present-progressive / just-completed / immediate-future ("I'll run…",
+    #     "Running…", "I ran…", "Saved…", "Done — created…"), not described
+    #     ("you can run…", "to run the tests…", "the test command is…").
+    #   * A turn that ASKS the user something (ends on a question) is a legitimate
+    #     clarify, not a fabricated completion — left alone.
+    class ActionClaimGuard
+      # Absolute ceiling on corrective turns. After this many the guard becomes
+      # BINDING (G1): it stops re-prompting and surfaces an honest deterministic
+      # message rather than loop forever against a model that won't call the tool.
+      #
+      # Lowered from 3 → 2: three accumulated identical "you lied, nothing
+      # happened" challenges drove the model into a confession spiral — it stopped
+      # acting and started confabulating false histories / pre-emptively
+      # apologising, and a legitimate steering change got stranded for 3 turns
+      # (#353b). A fresh atomic instruction recovered the model, so the injected
+      # text was the aggravator. We now bind after 2, and the SECOND injection
+      # DECAYS to a short, non-accusatory atomic instruction (see
+      # #reflection_message) instead of repeating the heavy challenge — so the
+      # reflections cannot compound into an inescapable loop.
+      MAX_REFLECTIONS = 2
+      # After this many consecutive corrective injections the wording DECAYS to a
+      # short, atomic, non-accusatory instruction (a single concrete tool call to
+      # make) instead of re-injecting the full "nothing happened" challenge — the
+      # repeated heavy framing is what compounds into the confession spiral
+      # (#353b). The first challenge still names the fabrication in full.
+      DECAY_AFTER_REFLECTIONS = 1
+      # Verbs that imply a state-changing action the agent performs THROUGH a
+      # tool. Each maps to the tool name(s) that would actually carry it out, so
+      # we only reflect when rubino actually exposes a way to do the claimed
+      # thing (no point nagging "I searched the web" if web tools are disabled).
+      ACTION_TOOLS = {
+        "run" => %w[shell ruby test git github],
+        "ran" => %w[shell ruby test git github],
+        "execute" => %w[shell ruby],
+        "executed" => %w[shell ruby],
+        "test" => %w[test shell],
+        "tested" => %w[test shell],
+        "save" => %w[write edit multi_edit patch],
+        "saved" => %w[write edit multi_edit patch],
+        "write" => %w[write edit multi_edit patch],
+        "wrote" => %w[write edit multi_edit patch],
+        "edit" => %w[edit multi_edit write patch],
+        "edited" => %w[edit multi_edit write patch],
+        "create" => %w[write edit multi_edit],
+        "created" => %w[write edit multi_edit],
+        "delete" => %w[shell],
+        "deleted" => %w[shell],
+        "remove" => %w[edit multi_edit shell write],
+        "removed" => %w[edit multi_edit shell write],
+        "move" => %w[shell],
+        "moved" => %w[shell],
+        "rename" => %w[shell edit multi_edit],
+        "renamed" => %w[shell edit multi_edit],
+        "install" => %w[shell],
+        "installed" => %w[shell],
+        "commit" => %w[git shell],
+        "committed" => %w[git shell],
+        "push" => %w[git shell],
+        "pushed" => %w[git shell],
+        "fetch" => %w[web_fetch shell git],
+        "fetched" => %w[web_fetch shell git]
+      }.freeze
+      # File/state MUTATION verbs — the highest-cost class for a coding agent.
+      # A toolless turn that asserts ANY of these as the assistant's own past
+      # action ("Updated both methods", "Added the docstring", "I removed mode()")
+      # has, by construction, changed nothing on disk. Unlike the verbs above,
+      # these are matched ANYWHERE in the message (not just sentence-initial or
+      # inside a completion window) and PRIORITISED over a trailing future-intent
+      # verb, so a message that bundles a fabricated edit-claim with a "then I'll
+      # run the tests" is challenged on the EDIT, not on the trailing run. Each
+      # maps to the write-family tool(s) that would actually carry it out, so the
+      # claim is only challenged when rubino actually exposed a way to mutate.
+      MUTATION_TOOLS = {
+        "edited" => %w[edit multi_edit write patch],
+        "wrote" => %w[write edit multi_edit patch],
+        "written" => %w[write edit multi_edit patch],
+        "updated" => %w[edit multi_edit write patch],
+        "created" => %w[write edit multi_edit],
+        "added" => %w[edit multi_edit write patch],
+        "removed" => %w[edit multi_edit write patch shell],
+        "saved" => %w[write edit multi_edit patch],
+        "modified" => %w[edit multi_edit write patch],
+        "renamed" => %w[shell edit multi_edit],
+        "deleted" => %w[shell edit multi_edit write],
+        "applied" => %w[patch edit multi_edit write],
+        "changed" => %w[edit multi_edit write patch],
+        "replaced" => %w[write edit multi_edit patch],
+        "inserted" => %w[edit multi_edit write patch],
+        "appended" => %w[edit multi_edit write patch],
+        "fixed" => %w[edit multi_edit write patch]
+      }.freeze
+      # The assistant asserts a mutation as its OWN completed action — past-tense
+      # mutation verb in a first-person OR a bare/completion narration, ANYWHERE
+      # in the text. Built per-verb from MUTATION_TOOLS' keys (which are already
+      # the past/participle surface forms). Matches "I updated…", "I've added…",
+      # "Updated both methods", "Done. Added the docstring", "✓ wrote the file",
+      # "- removed mode()". Deliberately past-tense only: a bare future "I'll
+      # update…" with a real tool call is handled by tool_count > 0; a future
+      # intent with NO tool call is still a fabrication and is also caught here
+      # via the first-person future framing below.
+      # Three alternatives, no interspersed comments (a `#` mid-concatenation
+      # would break the `\` line-continuation into a bare `(?:`):
+      #   1. first-person past / completed — "I updated", "I've added",
+      #      "I just wrote", "we removed", "now i updated".
+      #   2. first-person immediate-future with NO tool call — still a
+      #      fabrication — "I'll update…", "let me add…", "I will write…".
+      #   3. bare sentence-initial / list-item / post-completion past form —
+      #      "Updated both methods", "Added the docstring", "Done. Wrote the
+      #      file", "✓ removed mode()", "- created config.rb".
+      MUTATION_SELF_SRC =
+        "(?:" \
+        '\b(?:i|we|i\s?\'?ve|we\s?\'?ve|i\s+have|we\s+have|i\s+just|now\s+i)\b' \
+        '\s+(?:just\s+|now\s+|already\s+|go\s+ahead\s+and\s+)?(VERB)\b' \
+        '|\b(?:i\s?\'?ll|i\s+will|let\s+me|i\s?\'?m\s+going\s+to|i\s+am\s+going\s+to|' \
+        'going\s+to|about\s+to)\b\s+(?:just\s+|now\s+|go\s+ahead\s+and\s+)?(VERBBASE)\b' \
+        '|(?:\A|[.!?\n]\s*|^[-*]\s*|' \
+        '(?:\b(?:done|finished|complete|completed|ok|okay)\b|✓|✅|all\s+(?:set|done))[^.!?\n]{0,30}?)' \
+        '(VERB)\b' \
+        ")"
+      # base form of each mutation verb (for the immediate-future framing above):
+      # "I'll update", "let me add". Keyed by the past form stored in
+      # MUTATION_TOOLS so the alternation stays in lockstep with the tool map.
+      MUTATION_BASE = {
+        "edited" => "edit", "wrote" => "write", "written" => "write",
+        "updated" => "update", "created" => "create", "added" => "add",
+        "removed" => "remove", "saved" => "save", "modified" => "modify",
+        "renamed" => "rename", "deleted" => "delete", "applied" => "apply",
+        "changed" => "change", "replaced" => "replace", "inserted" => "insert",
+        "appended" => "append", "fixed" => "fix"
+      }.freeze
+      # State-RESULT phrasing — a fabricated mutation dressed as a fact about the
+      # file/state rather than as an action verb: "README.md now contains 'API
+      # v2'", "the file now has the import", "X is now set to 5", "the contents
+      # now read …", "it now reflects the change". No action verb at all, so the
+      # verb-based matchers above miss it entirely (this was the r5c NEW-1 hole).
+      # We require a "now" + a state predicate so we don't trip on a plain
+      # description ("the file contains a bug"). Backed by the write-family tools.
+      STATE_RESULT = Regexp.new(
+        '\bnow\s+(?:contains|has|holds|includes|reads|reflects|shows|' \
+        'looks\s+like|points\s+to)\b' \
+        '|\b(?:is|are|reads)\s+now\s+(?:set\s+to|equal\s+to|)' \
+        '|\bnow\s+(?:set\s+to|equal\s+to)\b' \
+        '|\bthe\s+(?:file|contents?|method|function|class|line|import|' \
+        'docstring|code|config(?:uration)?)\b[^.!?\n]{0,40}?\bnow\b' \
+        '|\b(?:contents?|file|value|content)\b[^.!?\n]{0,30}?\b(?:is|are)\s+now\b',
+        Regexp::IGNORECASE
+      )
+      # Git-MUTATION RESULT phrasing — a fabricated VCS mutation narrated as a
+      # fact rather than a first-person/sentence-initial action verb. This is the
+      # exact G1 shape: "Done. New branch feature/tax … committed as 0f60f1d." —
+      # a bare "committed as <sha>", "created (the) branch X", "new branch X",
+      # "pushed to origin/X", "the commit is <sha>", "on branch X now". The
+      # action-verb matcher misses these (the verb is mid-sentence, no "I", and
+      # the completion marker is >20 chars away from the verb), so a hallucinated
+      # SHA/branch sailed through to the user. Gated on a git/shell tool being
+      # exposed (handled at the call site). A bare SHA on its own is NOT enough
+      # (too noisy) — we require a commit/branch/push CONTEXT around it.
+      GIT_RESULT = Regexp.new(
+        '\bcommitted\s+(?:as|in|with(?:\s+(?:sha|hash|id))?|to)\b' \
+        '|\b(?:created|made|added|cut)\s+(?:a\s+|the\s+|new\s+)*branch\b' \
+        '|\bnew\s+branch\b[^.!?\n]{0,60}?\b(?:committed|created|with\s+the)\b' \
+        '|\bbranch\b[^.!?\n]{0,40}?\bcommitted\s+as\b' \
+        '|\b(?:pushed|push(?:ed)?)\s+(?:it\s+)?to\s+(?:origin|remote|the\s+remote)\b' \
+        '|\bthe\s+commit\s+(?:is|hash\s+is|sha\s+is)\b' \
+        '|\b(?:commit|sha|hash)\s+(?:is\s+)?\b[0-9a-f]{7,40}\b',
+        Regexp::IGNORECASE
+      )
+      # Base/infinitive surface of a tracked action verb so the claim phrase
+      # ("commit that", "run that") fits both the reflection ("you'd <claim>")
+      # and the binding replacement ("I did not <claim>") templates. ACTION_TOOLS
+      # keys mix base ("run") and past ("ran", "committed") forms; map the past
+      # ones back to base, leave the rest as-is.
+      ACTION_BASE = {
+        "ran" => "run", "executed" => "execute", "tested" => "test",
+        "saved" => "save", "wrote" => "write", "edited" => "edit",
+        "created" => "create", "deleted" => "delete", "removed" => "remove",
+        "moved" => "move", "renamed" => "rename", "installed" => "install",
+        "committed" => "commit", "pushed" => "push", "fetched" => "fetch"
+      }.freeze
+      # The write-family tools any mutation/state-result claim needs on offer for
+      # the guard to challenge it — no point challenging "the file now contains X"
+      # if rubino has no way to write at all this turn.
+      WRITE_FAMILY = %w[write edit multi_edit patch].freeze
+      # The VCS tools a fabricated git-mutation RESULT ("committed as <sha>")
+      # needs on offer for the guard to challenge it.
+      GIT_TOOLS = %w[git github shell].freeze
+      # The text honestly reports the block instead of fabricating success —
+      # "it was blocked", "nothing was applied", "not run/applied", "wasn't run",
+      # "needs approval", "no interactive session". Lets a denied/blocked turn
+      # that owns up be surfaced as-is; a fabricated diff dressed in honest words
+      # is still caught by FABRICATED_DIFF (checked first).
+      BLOCKED_HONEST = Regexp.new(
+        '\b(?:was|were|is|got)\s+blocked\b' \
+        '|\bnothing\s+(?:was|were|got)?\s*(?:applied|changed|written|run|saved)\b' \
+        '|\bnot\s+(?:been\s+)?(?:applied|run|executed|saved|written|committed)\b' \
+        '|\b(?:was|were)n\s?\'?t\s+(?:applied|run|executed|saved|written|committed)\b' \
+        '|\bneeds?\s+approval\b' \
+        '|\bno\s+interactive\s+session\b',
+        Regexp::IGNORECASE
+      )
+      # base verb => [progressive, past] surface forms. Stored explicitly rather
+      # than derived so English irregulars (run→running→ran, write→writing→wrote)
+      # are correct. Fuels the bare-lead / completion-lead / first-person matches.
+      SURFACE_FORMS = {
+        "run" => %w[running ran], "ran" => %w[running ran],
+        "write" => %w[writing wrote], "wrote" => %w[writing wrote],
+        "save" => %w[saving saved], "saved" => %w[saving saved],
+        "edit" => %w[editing edited], "edited" => %w[editing edited],
+        "create" => %w[creating created], "created" => %w[creating created],
+        "delete" => %w[deleting deleted], "deleted" => %w[deleting deleted],
+        "remove" => %w[removing removed], "removed" => %w[removing removed],
+        "move" => %w[moving moved], "moved" => %w[moving moved],
+        "rename" => %w[renaming renamed], "renamed" => %w[renaming renamed],
+        "commit" => %w[committing committed], "committed" => %w[committing committed],
+        "push" => %w[pushing pushed], "pushed" => %w[pushing pushed],
+        "fetch" => %w[fetching fetched], "fetched" => %w[fetching fetched],
+        "install" => %w[installing installed], "installed" => %w[installing installed],
+        "execute" => %w[executing executed], "executed" => %w[executing executed],
+        "test" => %w[testing tested], "tested" => %w[testing tested]
+      }.freeze
+      # First-person assertion that the action is happening / happened / is about
+      # to happen — NOT a description offered to the user. We require one of these
+      # framings immediately around a tracked verb so "you can run the tests"
+      # never trips, but "I'll run the tests", "running the tests now",
+      # "I ran the tests", "saved the file" do.
+      #   subject framings: "i", "i'll", "i've", "i have", "let me", "i'm",
+      #                     "i am", "i will", "i just", "going to", "about to"
+      #   bare-progressive / bare-past at sentence start: "running…", "saved…"
+      #   "i'll RUN", "i RAN", "let me SAVE" — the VERB placeholder is filled per
+      #   call. Built from a String (not a regex literal) so the path/comment
+      #   slashes elsewhere in this file never collide with the regex delimiter.
+      FIRST_PERSON_VERB_SRC =
+        '(?:\b(?:i\s?\'?ll|i\s?\'?ve|i\s+have|i\s+will|i\s+just|i\s?\'?m|i\s+am|' \
+        'let\s+me|going\s+to|about\s+to|now\s+i|i)\b\s+' \
+        '(?:just\s+|now\s+|go\s+ahead\s+and\s+)?)(VERB)\w*'
+      # Bare sentence-initial progressive/past at the start, after a sentence end,
+      # or as a list item: "Running the suite now.", "Saved to foo.py and ran
+      # it.", "Created the file." — a common MiniMax-M3 narration with no "I".
+      BARE_LEAD_VERB_SRC = '(?:\A|[.!?\n]\s*|^[-*]\s*)(VERBING)\b'
+      # A completion marker ("done", "✓", "all set", "all done", "finished")
+      # immediately before a past/progressive verb form — "Done — created the
+      # file.", "✓ saved.", "All set, removed mode()." — is the model declaring
+      # the work finished. The verb may sit up to ~20 non-period chars after.
+      COMPLETION_LEAD_SRC =
+        '(?:\b(?:done|finished|complete|completed)\b|✓|✅|all\s+(?:set|done))' \
+        '[^.!?\n]{0,20}?\b(VERBING)\b'
+      # cd / change-directory intent. rubino has no cd tool, so ANY first-person
+      # claim to change the working directory is unfulfillable — handled
+      # separately (honest rewrite, never a reflection). "cd /path", "cd ~",
+      # "changed the working directory", "switched to the folder", "moved into".
+      CD_INTENT = Regexp.new(
+        "(?:" \
+        '\bcd\s+[~/.]' \
+        '|\bchang(?:e|ed|ing)\b[^.\n]{0,40}\b(?:working\s+)?(?:dir(?:ectory)?|cwd|folder|workspace)\b' \
+        '|\bswitch(?:ed|ing)?\b[^.\n]{0,40}\b(?:to\s+the\s+)?(?:dir(?:ectory)?|cwd|folder)\b' \
+        '|\bmov(?:e|ed|ing)\s+(?:in)?to\s+(?:the\s+)?[~.][\w./-]*' \
+        ")",
+        Regexp::IGNORECASE
+      )
+      # The LATEST user message explicitly requested a NO-ACTION turn — a plan,
+      # a list, an explanation, a recall-from-memory answer, or it forbade tools
+      # outright ("do not implement yet", "without using any tools", "answer from
+      # memory"). On such a turn the model is SUPPOSED to produce prose and call
+      # no tool, so its "here's the plan; I'll add X next" is the requested
+      # deliverable, NOT a fabricated "done" — challenging it makes the model
+      # apologise for obeying. We detect a small set of no-action intents and skip
+      # the claim-challenge for that turn. Deliberately narrow: a plain task
+      # request ("add the docstring", "run the tests") matches NONE of these, so
+      # the anti-fabrication core still fires on real task turns.
+      #
+      #   * explicit tool prohibition  — "do not / don't run|use|call … tool(s)",
+      #                                  "without (using) (any) tools", "no tools".
+      #   * answer-from-memory / recall — "from memory", "from what you know/recall",
+      #                                  "don't look it up", "without reading".
+      #   * plan / don't-implement-yet  — "don't implement (yet)", "just (the)
+      #                                  plan", "outline/list the plan/steps",
+      #                                  "plan only", "before you implement".
+      #   * explain/describe-only ask   — "just explain|describe|tell me|summarize",
+      #                                  "explanation only", "no code".
+      # NOTE: no interspersed comments inside this concatenation — a `#` would
+      # break the `\` line-continuation (same gotcha as CD_INTENT above). The four
+      # intent groups are, in order: (1) explicit tool prohibition; (2)
+      # answer-from-memory / recall / don't-look-up; (3) plan / don't-implement-yet;
+      # (4) explain/describe-only ask.
+      NO_ACTION_REQUEST = Regexp.new(
+        "(?:" \
+        '\b(?:do\s+not|don\s?\'?t|dont|please\s+do\s+not|please\s+don\s?\'?t)\b' \
+        '[^.!?\n]{0,30}?\b(?:run|use|call|invoke|execute|touch|edit|write|' \
+        'implement|change|modify)\b' \
+        '|\bwithout\s+(?:using\s+|running\s+|calling\s+|invoking\s+)?' \
+        '(?:any\s+)?(?:tools?|tool\s+calls?|the\s+tools?)\b' \
+        '|\bno\s+tools?\b|\bdon\s?\'?t\s+(?:use|call|run)\s+(?:any\s+)?tools?\b' \
+        '|\b(?:from|out\s+of)\s+(?:your\s+)?memory\b' \
+        '|\bfrom\s+(?:what\s+you\s+(?:know|recall|remember))\b' \
+        '|\b(?:answer|recall|tell\s+me)\b[^.!?\n]{0,30}?\bfrom\s+memory\b' \
+        '|\bwithout\s+(?:reading|looking\s+(?:it\s+)?up|searching|checking)\b' \
+        '|\bdon\s?\'?t\s+(?:look\s+(?:it\s+)?up|read|search|check)\b' \
+        '|\b(?:do\s+not|don\s?\'?t|dont)\b[^.!?\n]{0,20}?\bimplement\b' \
+        '|\bimplement\b[^.!?\n]{0,10}?\b(?:nothing|yet)\b' \
+        '|\bbefore\s+(?:you\s+)?implement(?:ing)?\b' \
+        '|\b(?:just|only)\b[^.!?\n]{0,20}?\bthe\s+plan\b' \
+        '|\bplan\s+only\b|\bonly\s+(?:the\s+)?plan\b' \
+        '|\b(?:outline|list|describe|sketch|propose|give\s+me|show\s+me)\b' \
+        '[^.!?\n]{0,30}?\b(?:plan|steps|approach|strategy)\b' \
+        '|\b(?:just|only|simply)\b[^.!?\n]{0,15}?\b(?:explain|describe|tell\s+me|' \
+        'summarize|summarise|outline)\b' \
+        '|\b(?:explanation|description)\s+only\b|\bno\s+code\b' \
+        ")",
+        Regexp::IGNORECASE
+      )
+      # The text plainly admits the action did NOT / cannot happen — an honest
+      # non-completion, not a fabricated "done". A bare "can't"/"unable" anywhere
+      # in the answer is enough; this only EXEMPTS, never accuses, so a generous
+      # match is safe.
+      INABILITY = Regexp.new(
+        '\b(?:can\s?\'?t|cannot|could\s?n\'?t|unable\s+to|won\s?\'?t\s+be\s+able|' \
+        'don\s?\'?t\s+have|do\s+not\s+have|no\s+(?:such|test|way\s+to)|' \
+        'not\s+able\s+to|wasn\s?\'?t\s+able|isn\s?\'?t\s+(?:a|any)|there\s+(?:is|are)\s+no)\b',
+        Regexp::IGNORECASE
+      )
+      # PESSIMISTIC "I did NOTHING" claim (#381) — the inverse of every claim
+      # above. The model asserts it took no action at all: "I have not read a
+      # single file", "no tools were run/called", "I made no edits", "nothing was
+      # done/changed", "I didn't run/use any tools", "I have done nothing". A small
+      # phrase set is enough as the TRIGGER condition — we only act after VERIFYING
+      # it against the harness tool-call ledger (tool_count > 0), so a false
+      # positive here is harmless: the ledger gate, not the wording, decides.
+      # Kept model-agnostic (negations of read/run/edit/write/grep/search/tool +
+      # "nothing"/"no … was done" shapes), not a single provider's phrasing.
+      NO_ACTION_CLAIM = Regexp.new(
+        '\b(?:have\s+not|haven\s?\'?t|did\s+not|didn\s?\'?t|have\s+no|having\s+not|' \
+        'was\s+not\s+able\s+to|were\s+not\s+able\s+to|not)\b' \
+        '[^.!?\n]{0,40}?' \
+        '\b(?:read|run|ran|execute[d]?|use[d]?|call(?:ed)?|invoke[d]?|grep(?:ped)?|' \
+        "search(?:ed)?|made|make|edit(?:ed)?|written|wrote|create[d]?|change[d]?|" \
+        'modif(?:y|ied)|touch(?:ed)?|appl(?:y|ied)|do|done|perform(?:ed)?|take|taken|took)\b' \
+        '|\b(?:made|make|did|do|ran|run|read|wrote|written|applied|performed|took|taken)\b' \
+        '\s+(?:any\s+)?\bno\b\s+(?:tool[\s-]*calls?|tools?|files?|edits?|changes?|' \
+        'actions?|commands?|modifications?)\b' \
+        '|\b(?:no|zero)\s+(?:tool[\s-]*calls?|tools?|files?|edits?|changes?|actions?|' \
+        'commands?|modifications?)\b\s*' \
+        '(?:were\s+|was\s+|have\s+been\s+|been\s+|are\s+)?' \
+        '(?:run|ran|made|called|executed|invoked|read|performed|taken|applied)?\b' \
+        '|\b(?:nothing|no\s+action|no\s+work|not\s+a\s+single\s+\w+)\s+' \
+        '(?:was|were|has\s+been|have\s+been|got)\s+' \
+        '(?:done|run|made|changed|read|executed|performed|taken|applied|edited|written)\b' \
+        '|\b(?:i|we)\s+(?:have\s+|had\s+)?(?:did|do|done|made|changed|read|run|' \
+        'executed|performed|accomplished)\s+(?:absolutely\s+|literally\s+)?nothing\b' \
+        '|\bnot\s+a\s+single\s+(?:file|tool|edit|command|change)\b',
+        Regexp::IGNORECASE
+      )
+      # The tools whose execution actually MUTATES disk state — an "I made no
+      # edits" claim is most misleading when these ran. Used only to label the
+      # truthful harness note ("M edits"); the reconciliation itself fires on ANY
+      # tool having run, since "I read nothing" is equally false when a read ran.
+      MUTATING_TOOLS = %w[edit multi_edit write patch].freeze
+      # Build a guard for one turn. `exposed_tool_names` is the set of tool names
+      # the model actually had this turn (Loop's @turn_tools) — we only reflect a
+      # verb whose backing tool was on offer.
+      def initialize(exposed_tool_names:)
+        @exposed = Array(exposed_tool_names).map(&:to_s).uniq.freeze
+      end
+      # The corrective user message injected when a tracked action verb appears in
+      # a toolless turn. Names the offending claim so the model self-corrects.
+      #
+      # `prior_reflections` is how many corrective injections this turn ALREADY
+      # had. On the FIRST challenge (0 prior) we name the fabrication in full. On
+      # a later one (>= DECAY_AFTER_REFLECTIONS) we DECAY to a short, atomic,
+      # NON-accusatory instruction — repeating the heavy "you lied, nothing
+      # happened" framing is what compounded into the confession spiral (#353b);
+      # a single concrete "make the tool call or say you can't, in one line" is
+      # what actually recovered a stuck model.
+      def reflection_message(claimed_verb, prior_reflections: 0)
+        if prior_reflections >= DECAY_AFTER_REFLECTIONS
+          return "Still no tool call. Don't apologise or re-explain — just make " \
+                 "ONE actual tool call now to #{claimed_verb}, or reply in a " \
+                 "single line that you cannot and why."
+        end
+        "You said you'd #{claimed_verb} but issued NO tool call, so nothing " \
+          "actually happened — that text is not a real result and the file is " \
+          "unchanged on disk. Do ONE of two things now: (a) make the actual tool " \
+          "call to carry it out, or (b) if you cannot (missing info, blocked, " \
+          "denied, or no such capability), say plainly that you did NOT do it and " \
+          "explain why. Do NOT restate that it is done."
+      end
+      # A fabricated unified diff / patch / git-apply artifact in the prose —
+      # the F1 class: when its write tool is blocked, the model hands back a
+      # confident "ready to `git apply`" diff for files it never read, with
+      # invented hunks that would CORRUPT those files if applied. We detect the
+      # diff shape (a `--- a/…` + `+++ b/…` header, a `@@ … @@` hunk header, an
+      # explicit "git apply"/"apply this patch", or a ```diff/```patch fence) so
+      # that, on a denied/blocked turn, the diff is never surfaced as if it were
+      # a real, applicable artifact.
+      FABRICATED_DIFF = Regexp.new(
+        '^\s*---\s+a?/?\S.*\n\+\+\+\s+b?/?\S' \
+        '|^\s*@@\s.*@@' \
+        '|\bgit\s+apply\b' \
+        '|\bapply\s+(?:this\s+)?(?:the\s+)?patch\b' \
+        '|```(?:diff|patch)\b',
+        Regexp::IGNORECASE
+      )
+      # The honest answer that REPLACES a fabricated "I did the mutation" final
+      # answer once the reflection budget is spent (G1, BINDING). The model ran
+      # zero tools, so nothing changed on disk; we say so deterministically and
+      # name the claim, instead of letting its fabricated "Done. committed as
+      # <sha>" stand. `claim` is the human-readable phrase the guard already
+      # built ("committed the change", "the file now …").
+      def replacement_for_fabrication(claim)
+        "No tool call was made, so nothing was changed on disk — I did not " \
+          "#{claim}. (The previous lines claiming otherwise were not backed by " \
+          "any action and are not a real result.) Tell me to proceed and I'll " \
+          "actually run the tool to carry it out."
+      end
+      # The honest answer that REPLACES a success-narration OR a fabricated diff
+      # emitted AFTER a tool was denied/blocked this turn (F1/F2). The action was
+      # blocked and nothing was applied; any diff in the text is not a real,
+      # applicable artifact. `noninteractive` tailors the escape hatch: headless
+      # fail-closed → `--yolo` (and notes approvals.mode: skip no longer
+      # auto-runs non-interactively, #281/F2); user-denied → re-ask/approve.
+      def replacement_for_blocked(noninteractive:)
+        hatch =
+          if noninteractive
+            "nothing was applied. To run it non-interactively pass `--yolo` " \
+              "(note: `approvals.mode: skip` no longer auto-runs non-interactively " \
+              "for safety — use `--yolo`), or run rubino interactively and approve " \
+              "the action."
+          else
+            "nothing was applied. Approve the action (or re-run and allow it) " \
+              "if you want me to carry it out."
+          end
+        "That action was blocked, so #{hatch} Any diff or \"done\" above is not " \
+          "a real, applied change — I did not read/write those files, so I'm not " \
+          "presenting it as something to `git apply`."
+      end
+      # The honest answer that REPLACES a fabricated "I changed the directory"
+      # final turn. rubino genuinely cannot cd, so we tell the truth and point at
+      # the real mechanisms instead of letting the model claim a no-op.
+      CD_HONEST_ANSWER =
+        "I can't change my working directory — I have no `cd` tool, and each command " \
+        "runs from the session's workspace root, so a `cd` would not persist anyway. " \
+        "To work against another directory, either add it with `/add-dir <path>` " \
+        "(grants access this session) or relaunch rubino from that directory. " \
+        "If you want, tell me the path and I'll run commands against it explicitly " \
+        "(e.g. by passing the full path to each command)."
+      # The verdict for a finished, TEXT-ONLY turn.
+      #
+      #   tool_count   — tools that actually ran this turn (Loop's @tool_count)
+      #   denied_count — tools denied/blocked this turn (Loop's @denied_count):
+      #                  user-denied AND headless fail-closed both count here.
+      #   content      — the assistant's final text
+      #   noninteractive — true when a denial this turn was a headless
+      #                  "no interactive session" block (#260), so the honest
+      #                  message can point at `--yolo` (F2) vs "approve it".
+      #   terminal     — true on the LAST chance (reflection budget exhausted):
+      #                  the guard must now be BINDING and REPLACE the answer
+      #                  rather than ask for one more corrective turn (G1).
+      #   user_request — the LATEST genuine user message that drove this turn (the
+      #                  Loop passes the originating request, NOT a guard
+      #                  reflection). When it requested a NO-ACTION turn (plan /
+      #                  list / explain / "don't run" / "without tools" / "from
+      #                  memory"), the model is SUPPOSED to answer in prose with no
+      #                  tool call, so we skip the claim-challenge for this turn.
+      #
+      # Returns one of:
+      #   nil             — no fabrication detected; surface the text as-is.
+      #   [:cd, msg]      — replace the final answer with the honest cd message.
+      #   [:blocked, msg] — replace the answer: a tool was denied/blocked yet the
+      #                     text narrates success or emits a fabricated diff.
+      #   [:reflect, vb]  — reflect a corrective turn; `vb` is the claimed verb.
+      #   [:replace, msg] — BINDING terminal override: replace the fabricated
+      #                     "done" final text with the honest deterministic msg.
+      #
+      # The Loop decides what to do with each (rewrite vs re-enter the loop), and
+      # owns the MAX_REFLECTIONS cap (passing terminal: once it is reached).
+      def evaluate(content:, tool_count:, denied_count:, noninteractive: false,
+                   terminal: false, user_request: nil)
+        text = content.to_s
+        return nil if text.strip.empty?
+        return nil unless tool_count.to_i.zero?
+        # A tool was DENIED/BLOCKED this turn but none RAN. If the text then
+        # narrates success or hands back a fabricated diff/patch for files it
+        # never wrote (F1/F2), the action did NOT happen — replace it with the
+        # honest "blocked, nothing applied, use --yolo" message so the invented
+        # diff can never read as an applicable artifact. An honest "it was
+        # blocked / I couldn't" answer is left alone.
+        if denied_count.to_i.positive?
+          return nil unless blocked_but_claims?(text)
+          return [:blocked, replacement_for_blocked(noninteractive: noninteractive)]
+        end
+        # A turn that ends by asking the user is a legitimate clarify, not a
+        # claimed completion.
+        return nil if asks_user?(text)
+        # The user EXPLICITLY requested a no-action turn (a plan, a list, an
+        # explanation, an answer from memory, or "don't run/use any tools"). On
+        # such a turn the model is supposed to produce prose and call no tool, so
+        # its "here's the plan; I'll add X next" is the requested deliverable, not
+        # a fabricated "done". Skip the claim-challenge so the guard doesn't make
+        # the model apologise for obeying. (#353a) A plain task request matches
+        # none of these, so the anti-fabrication core still fires on real tasks.
+        return nil if no_action_requested?(user_request)
+        return [:cd, CD_HONEST_ANSWER] if cd_intent?(text)
+        # The model already owned up that it could NOT do the thing ("I can't
+        # run it because…", "unable to", "there is no test file"). An action
+        # verb in that sentence is honest framing, not a fabricated success —
+        # don't nag it.
+        return nil if honest_inability?(text)
+        # HIGHEST-COST class first: a fabricated file/state/git MUTATION
+        # ("Updated both methods", "committed as 0f60f1d", "README now contains
+        # 'API v2'") anywhere in the message. Prioritised over the trailing-intent
+        # verb below so a message that bundles a fake edit-claim with a "then I'll
+        # run the tests" is challenged on the EDIT, not the trailing run (r5c B1).
+        claim = fabricated_git_result(text) ||
+                fabricated_mutation(text) ||
+                fabricated_action_verb(text)
+        return nil if claim.nil?
+        # BINDING terminal override (G1): the reflection budget is spent and the
+        # model is STILL asserting a mutation it never made. Don't surface the
+        # fabrication — replace it with the honest deterministic message. Off the
+        # terminal turn we ask for one corrective turn first.
+        return [:replace, replacement_for_fabrication(claim)] if terminal
+        [:reflect, claim]
+      end
+      # PESSIMISTIC reconciliation (#381) — the INVERSE of #evaluate, and the only
+      # guard path that fires when tools DID run. A turn that genuinely executed
+      # tool calls (typically the budget/rate-limit-exhausted FORCED summary) can
+      # end with a confident "I did nothing — not a single file read, no edits"
+      # even though the harness ledger shows N tool calls and M real edits. Letting
+      # that stand makes the user believe no work happened and miss correct,
+      # uncommitted changes. The harness is the authority on side-effects, so we
+      # reconcile: append a truthful note naming what the ledger actually recorded.
+      #
+      #   content     — the final assistant text (the summary).
+      #   tool_count  — tools that actually RAN this turn (Loop's @tool_count).
+      #   edit_count  — of those, how many were MUTATING (Loop's @edit_count).
+      #
+      # Returns the harness diagnostic note ALONE (or nil), without splicing it
+      # into the answer text. The Loop routes this to STDERR / an event instead
+      # of appending it to the returned answer, so the note never pollutes
+      # `--output-format text` stdout (#418). Returns nil to leave the summary
+      # alone (the only-safe default) unless ALL hold:
+      #   * at least one tool ran (the ledger has something to contradict);
+      #   * the text actually CLAIMS no/zero action was taken (the small phrase set
+      #     above — the trigger), so a truthful "I ran X then Y" summary that names
+      #     its tools is left completely alone;
+      #   * the text does NOT already own up to the count (so we never double-note).
+      def pessimistic_summary_note(content:, tool_count:, edit_count: 0)
+        text = content.to_s
+        ran  = tool_count.to_i
+        return nil unless ran.positive?
+        return nil unless NO_ACTION_CLAIM.match?(text)
+        # The summary already reports the real count truthfully — don't pile on.
+        return nil if already_acknowledges_ledger?(text, ran)
+        harness_ledger_note(ran, edit_count.to_i)
+      end
+      # The truthful, harness-authored line appended to (or standing in for) a
+      # pessimistic summary. Keyed entirely on the ledger counts, never on wording.
+      def harness_ledger_note(tool_count, edit_count)
+        edits =
+          if edit_count.positive?
+            " (#{edit_count} edit#{"s" unless edit_count == 1} — review uncommitted changes)"
+          else
+            ""
+          end
+        "[harness note] That summary is not accurate: #{tool_count} tool " \
+          "call#{"s" unless tool_count == 1} actually ran this turn#{edits}. The " \
+          "tool-call ledger — not the summary — is the record of what happened, so " \
+          "review the working tree for real, possibly uncommitted, changes before " \
+          "assuming nothing was done."
+      end
+      private
+      # The summary already states, truthfully, that the tools ran (it cites the
+      # real count or owns the work) — so the pessimistic "I did nothing" trigger
+      # was a false positive (e.g. "I ran 5 tools but made no DB changes") and we
+      # must not append a contradicting note. We only suppress when the EXACT ran
+      # count appears next to a tool/call/ran word, which a genuine "I did nothing"
+      # confabulation never contains.
+      def already_acknowledges_ledger?(text, ran)
+        /\b#{ran}\b[^.!?\n]{0,30}?\b(?:tool|call|ran|executed|edit)/i.match?(text) ||
+          /\bharness\s+note\b/i.match?(text)
+      end
+      # The latest user request asked for a NO-ACTION turn (plan / list / explain
+      # / recall-from-memory / explicit "don't run|use tools"). nil/blank request
+      # → not a no-action turn (we can't tell, so we fall through to the normal
+      # fabrication checks — fail-safe toward catching fabrications). (#353a)
+      def no_action_requested?(user_request)
+        req = user_request.to_s
+        return false if req.strip.empty?
+        NO_ACTION_REQUEST.match?(req)
+      end
+      def honest_inability?(text)
+        INABILITY.match?(text)
+      end
+      # After a tool was DENIED/BLOCKED this turn, does the text still try to pass
+      # off the action as done — by narrating success (a mutation/action claim or
+      # a state-result), OR by handing back a fabricated unified diff/patch for
+      # files it never wrote (F1)? A fabricated diff fires on its own (the most
+      # dangerous artifact: it reads as `git apply`-able). A plain honest "it was
+      # blocked / I couldn't" with no success-claim and no diff is left alone.
+      def blocked_but_claims?(text)
+        return true if FABRICATED_DIFF.match?(text)
+        # An honest "blocked / can't / nothing was applied" answer with no diff
+        # is a real deny-recovery summary — leave it alone.
+        return false if honest_inability?(text) || blocked_honest?(text)
+        !!(cd_intent?(text) ||
+           fabricated_git_result(text) ||
+           fabricated_mutation(text) ||
+           fabricated_action_verb(text) ||
+           STATE_RESULT.match?(text))
+      end
+      # A fabricated VCS-mutation RESULT narrated as fact ("committed as 0f60f1d",
+      # "created branch feature/tax", "pushed to origin/main") — the G1 shape the
+      # verb matchers miss. Gated on a git/shell tool being on offer, and on the
+      # claim NOT being 2nd-person advice. Returns the human-readable claim phrase
+      # ("commit/create that on a branch") or nil.
+      def fabricated_git_result(text)
+        return nil unless GIT_TOOLS.any? { |t| @exposed.include?(t) }
+        return nil if advice_only?(text)
+        return nil unless GIT_RESULT.match?(text)
+        "make that git change (commit/branch/push)"
+      end
+      def blocked_honest?(text)
+        BLOCKED_HONEST.match?(text)
+      end
+      # The text claims to have changed the working directory — and rubino can't.
+      def cd_intent?(text)
+        return false unless CD_INTENT.match?(text)
+        # Only when framed as the assistant's own action / completion, not as
+        # advice to the user ("you can cd into …", "run cd /x yourself").
+        first_person_anywhere?(text) || CD_INTENT.match?(leading_clause(text))
+      end
+      # The first tracked action verb the text asserts as the assistant's own
+      # doing, whose backing tool rubino actually exposed this turn, as a
+      # base-form claim phrase ("run that", "commit that") that reads naturally
+      # in BOTH "You said you'd <claim>" (reflection) and "I did not <claim>"
+      # (binding replacement). nil when none.
+      def fabricated_action_verb(text)
+        ACTION_TOOLS.each do |verb, tools|
+          next unless tools.any? { |t| @exposed.include?(t) }
+          next unless asserts_verb?(text, verb)
+          return "#{action_base(verb)} that"
+        end
+        nil
+      end
+      def action_base(verb)
+        ACTION_BASE.fetch(verb, verb)
+      end
+      # The first fabricated file/state MUTATION the toolless turn asserts, as a
+      # human-readable claim phrase for the reflection ("updated the file",
+      # "added the docstring", "the file now contains that"). Fires on:
+      #   * a past-tense mutation verb asserted as the assistant's own action
+      #     ANYWHERE in the message (not just sentence-initial), or
+      #   * a state-RESULT phrasing ("X now contains …", "the file now has …").
+      # Gated on a write-family tool being exposed and on the claim NOT being
+      # 2nd-person advice ("you should add…", "you can write…", "to update…").
+      # nil when the turn makes no fabricated mutation claim.
+      def fabricated_mutation(text)
+        return nil unless WRITE_FAMILY.any? { |t| @exposed.include?(t) }
+        return nil if advice_only?(text)
+        MUTATION_TOOLS.each do |past, tools|
+          next unless tools.any? { |t| @exposed.include?(t) }
+          next unless asserts_mutation?(text, past)
+          # Base form so the phrase reads in BOTH "you'd <claim>" and "I did not
+          # <claim>" ("update the file", "apply the change").
+          return "#{MUTATION_BASE.fetch(past, past)} the file"
+        end
+        # State-result phrasing with no action verb at all ("README now contains
+        # 'API v2'", "the file now has the import") — a mutation dressed as fact.
+        return "make that change to the file" if STATE_RESULT.match?(text)
+        nil
+      end
+      # True when `past` (an already-past/participle mutation form) is asserted as
+      # the assistant's OWN completed (or unfulfilled-future) mutation anywhere in
+      # the text. Built from MUTATION_SELF_SRC with the past form and its base
+      # form (for the "I'll <base>…" future framing) substituted in.
+      def asserts_mutation?(text, past)
+        base = MUTATION_BASE.fetch(past, past)
+        src = MUTATION_SELF_SRC.gsub("VERBBASE", Regexp.escape(base))
+                               .gsub("VERB", Regexp.escape(past))
+        Regexp.new(src, Regexp::IGNORECASE).match?(text)
+      end
+      # The whole message is 2nd-person ADVICE / a how-to, not a 1st-person
+      # claim — "you should add the import", "you can write it with…", "to update
+      # the file, use the edit tool". A mutation verb in that framing is help
+      # text, not a fabricated completion, so the guard must leave it alone. We
+      # only treat it as advice when there is NO competing first-person claim, so
+      # "I updated it; you can run it" is still challenged.
+      def advice_only?(text)
+        return false if /\b(?:i|we)\b\s*'?(?:ll|ve|m)?\b/i.match?(text) &&
+                        first_person_anywhere?(text)
+        /\byou\s+(?:can|could|should|may|might|will|need\s+to|have\s+to|want\s+to)\b/i
+          .match?(text) ||
+          /\bto\s+\w+[^.!?\n]{0,40}?,?\s*use\s+the\b/i.match?(text)
+      end
+      # True when `verb` appears in a first-person "I'll/I just/now" framing OR as
+      # a bare sentence-initial progressive/past — the narration shapes that mean
+      # "I am doing / did this", as opposed to describing it to the user.
+      def asserts_verb?(text, verb)
+        # The verb plus all its surface forms (write/writing/wrote/written via
+        # the union) — so "i've written", "i ran", "i'm saving" all match the
+        # first-person framing, not just the dictionary form.
+        alt = verb_alternation(verb)
+        fp = Regexp.new(FIRST_PERSON_VERB_SRC.sub("VERB", alt), Regexp::IGNORECASE)
+        return true if fp.match?(text)
+        # Sentence-initial / list-item progressive-or-past: "Running…", "Saved…".
+        bare = Regexp.new(BARE_LEAD_VERB_SRC.sub("VERBING", verbings_for(verb)),
+                          Regexp::IGNORECASE)
+        return true if bare.match?(text)
+        # Completion-lead narration: "Done — created the file.", "✓ saved.",
+        # "All set, removed mode()." A done/✓/all-set marker immediately before a
+        # past/progressive form is the model declaring the work finished.
+        lead = Regexp.new(COMPLETION_LEAD_SRC.sub("VERBING", verbings_for(verb)),
+                          Regexp::IGNORECASE)
+        lead.match?(text)
+      end
+      # The regex-source alternation of a verb and every surface form we track for
+      # it (run|running|ran, write|writing|wrote|written, …). Used to match the
+      # verb in a first-person framing regardless of tense.
+      def verb_alternation(verb)
+        forms = [verb] + SURFACE_FORMS.fetch(verb, ["#{verb}ing", "#{verb}ed"])
+        # write→written participle that the regular -ed/-ing forms miss.
+        forms << "written" if %w[write wrote].include?(verb)
+        Regexp.union(forms.uniq).source
+      end
+      # The surface forms that begin a bare narration sentence for a given base
+      # verb: the bare verb (sentence-initial imperative-as-claim "Run the tests
+      # now."), its progressive ("Running…"), and its past ("Ran…"/"Saved…").
+      # Stored explicitly rather than derived so English irregulars (run→running,
+      # write→writing→wrote) are correct.
+      def verbings_for(verb)
+        forms = [verb] + SURFACE_FORMS.fetch(verb, ["#{verb}ing", "#{verb}ed"])
+        forms << "written" if %w[write wrote].include?(verb)
+        Regexp.union(forms.uniq).source
+      end
+      def first_person_anywhere?(text)
+        /\b(?:i\s?'?ll|i\s?'?ve|i\s+have|i\s+will|i\s+just|i\s?'?m|i\s+am|let\s+me|
+            i\s+chang|i\s+switch|i\s+mov|now\s+i)\b/ix.match?(text)
+      end
+      # The first sentence/clause, where a bare "Changed directory." lead-in lives.
+      def leading_clause(text)
+        text.strip[/\A[^.!?\n]{0,120}/].to_s
+      end
+      # The text ends by asking the user (a trailing question) — a legitimate
+      # clarify, not a fabricated completion. We look only at the tail so a
+      # rhetorical "?" earlier in a long answer doesn't exempt a fabrication.
+      def asks_user?(text)
+        tail = text.strip[-160..] || text.strip
+        tail.rstrip.end_with?("?")
+      end
+    end
+  end
+end