RubyGems - rubino-agent - Versions diffs - 0.3.0 → 0.5.0 - Mend

rubino-agent 0.3.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

checksums.yaml +4 -4
data/.rubocop_todo.yml +11 -2
data/AGENTS.md +1 -1
data/CHANGELOG.md +172 -5
data/CONTRIBUTING.md +10 -1
data/README.md +14 -5
data/Rakefile +31 -0
data/docs/agents.md +42 -23
data/docs/architecture.md +2 -2
data/docs/commands.md +35 -3
data/docs/configuration.md +20 -23
data/docs/getting-started.md +5 -3
data/docs/security.md +16 -5
data/docs/skills.md +31 -0
data/docs/troubleshooting.md +1 -1
data/exe/rubino +16 -2
data/install.sh +721 -59
data/lib/rubino/active_agent.rb +73 -0
data/lib/rubino/agent/action_claim_guard.rb +881 -0
data/lib/rubino/agent/agent_registry.rb +5 -2
data/lib/rubino/agent/definition.rb +1 -9
data/lib/rubino/agent/fallback_chain.rb +0 -6
data/lib/rubino/agent/iteration_budget.rb +109 -3
data/lib/rubino/agent/loop.rb +476 -20
data/lib/rubino/agent/model_call_runner.rb +81 -3
data/lib/rubino/agent/prompts/build.txt +22 -5
data/lib/rubino/agent/response_validator.rb +8 -0
data/lib/rubino/agent/runner.rb +133 -8
data/lib/rubino/agent/tool_executor.rb +166 -14
data/lib/rubino/agent/truncation_continuation.rb +4 -1
data/lib/rubino/api/server.rb +19 -0
data/lib/rubino/attachments/classify.rb +35 -17
data/lib/rubino/boot/config_guard.rb +71 -0
data/lib/rubino/cli/chat/completion_builder.rb +42 -6
data/lib/rubino/cli/chat/idle_card_host.rb +7 -1
data/lib/rubino/cli/chat/session_resolver.rb +87 -21
data/lib/rubino/cli/chat_command.rb +1189 -50
data/lib/rubino/cli/commands.rb +282 -2
data/lib/rubino/cli/config_command.rb +68 -8
data/lib/rubino/cli/doctor_command.rb +204 -12
data/lib/rubino/cli/jobs_command.rb +12 -0
data/lib/rubino/cli/memory_command.rb +53 -20
data/lib/rubino/cli/onboarding_wizard.rb +79 -6
data/lib/rubino/cli/session_command.rb +172 -18
data/lib/rubino/cli/setup_command.rb +131 -8
data/lib/rubino/cli/skills_command.rb +183 -9
data/lib/rubino/cli/trust_gate.rb +16 -7
data/lib/rubino/commands/built_ins.rb +2 -0
data/lib/rubino/commands/command.rb +12 -2
data/lib/rubino/commands/executor.rb +149 -12
data/lib/rubino/commands/handlers/agent_switch.rb +100 -0
data/lib/rubino/commands/handlers/agents.rb +156 -41
data/lib/rubino/commands/handlers/config.rb +4 -1
data/lib/rubino/commands/handlers/help.rb +113 -14
data/lib/rubino/commands/handlers/memory.rb +15 -5
data/lib/rubino/commands/handlers/sessions.rb +26 -3
data/lib/rubino/commands/handlers/status.rb +9 -4
data/lib/rubino/commands/loader.rb +12 -0
data/lib/rubino/config/configuration.rb +86 -24
data/lib/rubino/config/defaults.rb +140 -33
data/lib/rubino/config/loader.rb +62 -12
data/lib/rubino/config/validator.rb +341 -0
data/lib/rubino/config/writer.rb +123 -31
data/lib/rubino/context/compressor.rb +184 -22
data/lib/rubino/context/environment_inspector.rb +2 -2
data/lib/rubino/context/file_discovery.rb +2 -2
data/lib/rubino/context/message_boundary.rb +27 -1
data/lib/rubino/context/project_languages.rb +90 -0
data/lib/rubino/context/prompt_assembler.rb +105 -22
data/lib/rubino/context/summary_builder.rb +45 -4
data/lib/rubino/context/token_budget.rb +36 -11
data/lib/rubino/context/token_estimate.rb +45 -0
data/lib/rubino/context/tool_result_pruner.rb +81 -0
data/lib/rubino/database/connection.rb +154 -3
data/lib/rubino/database/migrations/001_create_initial_schema.rb +314 -40
data/lib/rubino/database/migrator.rb +98 -5
data/lib/rubino/documents/cap_exceeded.rb +13 -0
data/lib/rubino/documents/converters/csv.rb +4 -3
data/lib/rubino/documents/converters/docx.rb +29 -5
data/lib/rubino/documents/converters/html.rb +5 -1
data/lib/rubino/documents/converters/json.rb +2 -1
data/lib/rubino/documents/converters/pdf.rb +11 -2
data/lib/rubino/documents/converters/plain.rb +2 -1
data/lib/rubino/documents/converters/pptx.rb +11 -2
data/lib/rubino/documents/converters/xlsx.rb +35 -4
data/lib/rubino/documents/converters/xml.rb +2 -1
data/lib/rubino/documents/limits.rb +210 -0
data/lib/rubino/documents.rb +10 -3
data/lib/rubino/errors.rb +36 -5
data/lib/rubino/interaction/cancel_token.rb +19 -3
data/lib/rubino/interaction/events.rb +13 -0
data/lib/rubino/interaction/lifecycle.rb +99 -13
data/lib/rubino/interaction/polishing.rb +176 -0
data/lib/rubino/jobs/cron_job_repository.rb +5 -8
data/lib/rubino/jobs/handlers/cleanup_sessions_job.rb +11 -0
data/lib/rubino/jobs/handlers/distill_skill_job.rb +65 -9
data/lib/rubino/jobs/queue.rb +63 -8
data/lib/rubino/jobs/runner.rb +24 -6
data/lib/rubino/jobs/worker.rb +0 -4
data/lib/rubino/llm/adapter_response.rb +47 -4
data/lib/rubino/llm/credential_check.rb +15 -16
data/lib/rubino/llm/error_classifier.rb +89 -1
data/lib/rubino/llm/inline_think_filter.rb +69 -12
data/lib/rubino/llm/request.rb +30 -3
data/lib/rubino/llm/ruby_llm_adapter.rb +394 -46
data/lib/rubino/llm/tool_bridge.rb +113 -9
data/lib/rubino/mcp/manager.rb +18 -1
data/lib/rubino/mcp/mcp_tool_wrapper.rb +14 -3
data/lib/rubino/memory/aux_retry.rb +107 -0
data/lib/rubino/memory/backends/sqlite.rb +73 -44
data/lib/rubino/memory/backends.rb +23 -7
data/lib/rubino/memory/salience_gate.rb +103 -0
data/lib/rubino/memory/sqlite_extraction.rb +70 -0
data/lib/rubino/memory/sqlite_extraction_prompt.rb +11 -0
data/lib/rubino/memory/store.rb +33 -5
data/lib/rubino/memory/threat_scanner.rb +52 -0
data/lib/rubino/output/cost.rb +52 -0
data/lib/rubino/output/headless_block_latch.rb +53 -0
data/lib/rubino/output/result_serializer.rb +222 -0
data/lib/rubino/output/turn_recorder.rb +77 -0
data/lib/rubino/security/approval_policy.rb +227 -32
data/lib/rubino/security/command_allowlist.rb +79 -4
data/lib/rubino/security/doom_loop_detector.rb +21 -2
data/lib/rubino/security/hardline_guard.rb +189 -16
data/lib/rubino/security/pattern_matcher.rb +28 -5
data/lib/rubino/security/prefix_deriver.rb +25 -6
data/lib/rubino/security/readonly_commands.rb +145 -5
data/lib/rubino/security/secret_path.rb +134 -0
data/lib/rubino/security/url_safety.rb +255 -0
data/lib/rubino/session/repository.rb +212 -11
data/lib/rubino/session/store.rb +139 -14
data/lib/rubino/skills/installer.rb +230 -0
data/lib/rubino/skills/prompt_index.rb +2 -2
data/lib/rubino/skills/registry.rb +52 -1
data/lib/rubino/skills/skill.rb +64 -3
data/lib/rubino/skills/skill_tool.rb +16 -5
data/lib/rubino/tools/background_tasks.rb +157 -13
data/lib/rubino/tools/base.rb +204 -3
data/lib/rubino/tools/edit_tool.rb +73 -18
data/lib/rubino/tools/glob_tool.rb +48 -9
data/lib/rubino/tools/grep_tool.rb +103 -9
data/lib/rubino/tools/multi_edit_tool.rb +64 -9
data/lib/rubino/tools/patch_tool.rb +5 -0
data/lib/rubino/tools/read_attachment_tool.rb +3 -1
data/lib/rubino/tools/read_tool.rb +33 -15
data/lib/rubino/tools/read_tracker.rb +153 -35
data/lib/rubino/tools/registry.rb +113 -12
data/lib/rubino/tools/result.rb +9 -1
data/lib/rubino/tools/ruby_tool.rb +0 -0
data/lib/rubino/tools/shell_registry.rb +70 -0
data/lib/rubino/tools/shell_tool.rb +40 -1
data/lib/rubino/tools/summarize_file_tool.rb +6 -0
data/lib/rubino/tools/task_stop_tool.rb +10 -16
data/lib/rubino/tools/task_tool.rb +36 -8
data/lib/rubino/tools/vision_tool.rb +5 -0
data/lib/rubino/tools/webfetch_tool.rb +39 -7
data/lib/rubino/tools/websearch_tool.rb +92 -30
data/lib/rubino/tools/write_tool.rb +23 -4
data/lib/rubino/ui/api.rb +10 -1
data/lib/rubino/ui/base.rb +11 -0
data/lib/rubino/ui/bottom_composer.rb +382 -74
data/lib/rubino/ui/cli.rb +515 -83
data/lib/rubino/ui/completion_menu.rb +11 -7
data/lib/rubino/ui/headless_trace.rb +63 -0
data/lib/rubino/ui/live_region.rb +70 -7
data/lib/rubino/ui/markdown_renderer.rb +142 -7
data/lib/rubino/ui/notifier.rb +0 -2
data/lib/rubino/ui/null.rb +52 -5
data/lib/rubino/ui/paste_store.rb +16 -2
data/lib/rubino/ui/queued_indicators.rb +6 -1
data/lib/rubino/ui/status_bar.rb +61 -7
data/lib/rubino/ui/streaming_markdown.rb +59 -6
data/lib/rubino/ui/subagent_view.rb +29 -4
data/lib/rubino/ui/tool_label.rb +52 -0
data/lib/rubino/update_check.rb +39 -4
data/lib/rubino/util/atomic_file.rb +117 -0
data/lib/rubino/util/ignore_rules.rb +120 -0
data/lib/rubino/util/output.rb +229 -12
data/lib/rubino/util/secrets_mask.rb +70 -7
data/lib/rubino/util/spill_store.rb +153 -0
data/lib/rubino/version.rb +1 -1
data/lib/rubino/workspace.rb +9 -1
data/lib/rubino.rb +191 -7
data/rubino-agent.gemspec +1 -0
data/skills/ruby-expert/SKILL.md +1 -0
metadata +42 -12
data/lib/rubino/agent/router.rb +0 -65
data/lib/rubino/database/migrations/002_create_runs.rb +0 -45
data/lib/rubino/database/migrations/003_create_skill_states.rb +0 -15
data/lib/rubino/database/migrations/004_create_cron_jobs.rb +0 -36
data/lib/rubino/database/migrations/005_create_oauth_connections.rb +0 -27
data/lib/rubino/database/migrations/006_create_webhook_deliveries.rb +0 -34
data/lib/rubino/database/migrations/007_create_messages_fts.rb +0 -59
data/lib/rubino/database/migrations/008_create_memory_facts.rb +0 -75
data/lib/rubino/database/migrations/009_create_memory_graph.rb +0 -55
data/lib/rubino/database/migrations/010_add_owner_pid_to_sessions.rb +0 -20

data/lib/rubino/tools/glob_tool.rb CHANGED Viewed

@@ -29,6 +29,11 @@ module Rubino
             max_results: {
               type: "integer",
               description: "Maximum number of results (default: 100)"
+            },
+            include_ignored: {
+              type: "boolean",
+              description: "Include files git ignores (.gitignore, build artifacts). " \
+                           "Default false — results honor .gitignore like grep does."
             }
           },
           required: %w[pattern]
@@ -40,18 +45,20 @@ module Rubino
       end
       def call(arguments)
-        pattern = arguments["pattern"] || arguments[:pattern]
-        path = arguments["path"] || arguments[:path] || "."
+        pattern     = arguments["pattern"] || arguments[:pattern]
+        path        = arguments["path"]    || arguments[:path] || "."
         max_results = arguments["max_results"] || arguments[:max_results] || 100
+        include_ignored = arguments["include_ignored"] || arguments[:include_ignored] || false
-        expanded_path = File.expand_path(path)
-        return "Error: Directory not found: #{path}" unless File.directory?(expanded_path)
+        # Glob is BROAD (#406): it resolves any path like Hermes/Claude/Codex.
+        # The read allowlist was never the data-loss boundary (that's on the
+        # WRITE path); glob only lists file PATHS (no content), so there is
+        # nothing to denylist here — secret protection lives on read/grep.
+        expanded_path = File.expand_path(path, workspace_root)
+        full_pattern  = resolve_pattern(pattern, path, expanded_path)
+        return full_pattern if full_pattern.is_a?(String) && full_pattern.start_with?("Error:")
-        full_pattern = File.join(expanded_path, pattern)
-        files = Dir.glob(full_pattern)
-                   .select { |f| File.file?(f) }
-                   .sort_by { |f| -File.mtime(f).to_i }
-                   .first(max_results)
+        files = matching_files(full_pattern, expanded_path, max_results, include_ignored)
         if files.empty?
           "No files matched pattern: #{pattern}"
@@ -64,6 +71,38 @@ module Rubino
             body_kind: :plain }
         end
       end
+      private
+      # Globs +full_pattern+, drops dirs and (by default) git-ignored files,
+      # sorts newest-first, and caps at +max_results+. Honoring .gitignore here
+      # keeps glob consistent with grep's rg path (#375c); include_ignored: true
+      # opts back into the raw set.
+      def matching_files(full_pattern, expanded_path, max_results, include_ignored)
+        ignore = include_ignored ? nil : Util::IgnoreRules.new
+        Dir.glob(full_pattern)
+           .select { |f| File.file?(f) }
+           .reject { |f| ignore&.ignored?(f, expanded_path) }
+           .sort_by { |f| -File.mtime(f).to_i }
+           .first(max_results)
+      end
+      # Builds the pattern passed to Dir.glob.
+      #
+      # An ABSOLUTE pattern (e.g. `/work/shopkit/cart.py`) names the exact file
+      # already — glob it as-is. Joining it onto the base produced a doubled
+      # path (`File.join("/work", "/work/…")` → `/work/work/…`) that matched
+      # nothing, so `glob` of a file that plainly exists returned "No files
+      # matched" and the agent fell back to `ls` (r6 F1). A RELATIVE pattern is
+      # anchored at the workspace primary root (terminal.cwd || launch cwd), not
+      # Dir.pwd, so it agrees with read/edit (r6 F3). Returns an "Error:" string
+      # when the relative base directory doesn't exist.
+      def resolve_pattern(pattern, path, expanded_path)
+        return pattern.to_s if pattern.to_s.start_with?(File::SEPARATOR)
+        return "Error: Directory not found: #{path}" unless File.directory?(expanded_path)
+        File.join(expanded_path, pattern)
+      end
     end
   end
 end

data/lib/rubino/tools/grep_tool.rb CHANGED Viewed

@@ -70,7 +70,19 @@ module Rubino
         before  = (ctx || arguments["before"] || arguments[:before] || 0).to_i.clamp(0, 50)
         after   = (ctx || arguments["after"]  || arguments[:after]  || 0).to_i.clamp(0, 50)
-        expanded_path = File.expand_path(path)
+        expanded_path = expand_workspace_path(path)
+        # Search is BROAD (#406): grep resolves any NON-secret path like
+        # Hermes/Claude/Codex. A grep whose `path` is a SECRET file directly
+        # (#446) is gated UPSTREAM by Security::ApprovalPolicy#decide (→ :ask),
+        # exactly like read — so it is NOT refused here; an approved grep of a
+        # secret file proceeds, a denied/headless one never reaches #call.
+        #
+        # F2: a DIRECTORY grep with `include: "*.env"` is NOT a secret target —
+        # the gate above can't see it — but rg's --glob OVERRIDES the default
+        # hidden-exclusion and would LEAK the matched .env lines. We therefore
+        # post-filter the RESULTS (see #filter_secret_hits): any result line that
+        # points at a secret file is stripped, so secrets never escape via an
+        # include-glob regardless of approval.
         return "Error: Path not found: #{path}" unless File.exist?(expanded_path)
         if ripgrep_available?
@@ -86,6 +98,28 @@ module Rubino
         system("which rg > /dev/null 2>&1")
       end
+      # True when an rg output line (`<file>:<lineno>:…`, a `<file>:<lineno>-…`
+      # context line, or a bare `--` separator) points at a secret/credential
+      # file — used to strip it from the result set so an include-glob over a
+      # directory can't leak a secret (F2). rg prints the file path verbatim
+      # from the search root we gave it; when the root is a single FILE rg omits
+      # the path prefix, but that case is the directly-targeted (approved) grep,
+      # so we resolve a bare line against `search_root` and let it fall through
+      # as non-secret. The `--` separator carries no path and is kept.
+      def secret_result_line?(line, search_root)
+        return false if line.nil? || line.start_with?("--")
+        # Split off the leading "<file>:<lineno>" prefix. The lazy `.*?` stops at
+        # the FIRST ':' that is followed by a digit run and then ':' or '-';
+        # everything before that ':' is treated as the file path.
+        m = line.match(/\A(.*?):\d+[:-]/)
+        return false unless m
+        file = m[1]
+        file = File.expand_path(file, search_root) unless file.start_with?(File::SEPARATOR)
+        !secret_path_category(file).nil?
+      end
       def search_with_ripgrep(pattern, path, include_pattern, max_results, before, after)
         # Build argv array and use Open3 to avoid shell injection — pattern
         # and path are passed as separate arguments, never interpolated into a
@@ -104,29 +138,75 @@ module Rubino
         argv += ["-A", after.to_s]  if after.positive?
         argv += [pattern, path]
-        output = IO.popen(argv, err: %i[child out], &:read)
+        # STREAM rg's output line-by-line and STOP after max_results (#375a).
+        # `IO.popen(argv).read` buffered the ENTIRE rg output — a pattern that
+        # matches a huge file held 100MB+ in memory just to `.first(max_results)` it.
+        # Keep at most max_results lines; reading one further line only sets
+        # more_exist ("there are more"). Then close the pipe (SIGPIPE stops rg)
+        # so neither memory nor CPU scales with the match count.
+        # F2: filter secret hits ONLY for a DIRECTORY search (an include-glob
+        # like `*.env` can pull a credential file in). A grep whose path is the
+        # secret FILE itself was already approved by the upstream gate, so its
+        # own lines must be returned, not stripped.
+        filter_secrets = File.directory?(path)
+        lines = []
+        more_exist = false
+        IO.popen(argv, err: %i[child out]) do |io|
+          io.each_line do |line|
+            # Drop a hit that points at a secret file BEFORE it counts toward the
+            # cap, so a result set of only-secrets doesn't crowd out the cap with
+            # content we'll never return.
+            next if filter_secrets && secret_result_line?(line, path)
+            if lines.size >= max_results
+              more_exist = true
+              break
+            end
+            lines << line
+          end
+          io.close # close early → rg gets SIGPIPE and stops scanning
+        end
         status = $?.exitstatus
+        # When WE deliberately close the pipe early after hitting the cap
+        # (#391/regression #375), rg is killed mid-scan and exits non-zero —
+        # and on some platforms the broken-pipe exit is reported as 1, the SAME
+        # code rg uses for a genuine "no matches". The old `status != 1` guard
+        # therefore EXCLUDED that case and fell through to the `status == 1`
+        # branch, dropping the 50 matches we already collected and reporting
+        # "No matches". Whenever we collected matches AND closed early (more_exist),
+        # it is unambiguously a success regardless of rg's exit code; a real
+        # "no matches" is 0 collected lines and we never closed early, so it
+        # still reaches the status==1 branch and reports correctly.
+        status = 0 if lines.any? && (more_exist || status != 1)
         if status == 0
-          all_lines = output.lines
-          lines     = all_lines.first(max_results)
-          more      = all_lines.size - lines.size
+          # We can't cheaply know the exact remaining count once we stop early,
+          # so report "more" without an exact number when the cap was hit.
+          more      = more_exist
           header    = "#{lines.size} match(es) shown" \
-                      "#{" (#{more} more — raise max_results or narrow the pattern)" if more.positive?}"
+                      "#{" (more — raise max_results or narrow the pattern)" if more}"
           full      = "#{header}:\n\n#{lines.join}"
           { output: full,
-            metrics: "#{lines.size} match#{"es" if lines.size != 1}#{"+" if more.positive?}",
+            metrics: "#{lines.size} match#{"es" if lines.size != 1}#{"+" if more}",
             body: Util::Output.preview(full),
             body_kind: :plain }
         elsif status == 1
           "No matches found for pattern: #{pattern}"
         else
-          "Error executing search: #{output}"
+          "Error executing search: #{lines.join}"
         end
       end
       def search_with_ruby(pattern, path, include_pattern, max_results, before, after)
-        regex   = Regexp.new(pattern)
+        # The Ruby fallback is the LIVE path whenever rg isn't on PATH. A bad
+        # pattern the model emits (e.g. an unclosed paren) would otherwise
+        # raise RegexpError and hand the model a raw exception; return a clean,
+        # actionable tool error instead.
+        begin
+          regex = Regexp.new(pattern)
+        rescue RegexpError => e
+          return "Error: invalid regex pattern: #{e.message}"
+        end
         results = []
         # ripgrep accepts a single FILE as well as a directory; mirror that
@@ -134,8 +214,22 @@ module Rubino
         # `path` is a file we search it directly (include_pattern is moot).
         files = File.file?(path) ? [path] : Dir.glob(File.join(path, "**", include_pattern || "*"))
+        # Honor .gitignore the SAME way the rg path does (#375b): without this
+        # the fallback returned a different, larger set (build artifacts,
+        # node_modules, ignored secrets) than rg — non-deterministic on whether
+        # rg is installed. A single FILE path the model targeted directly is
+        # always searched (mirrors rg searching an explicit file argument).
+        ignore = Util::IgnoreRules.new
+        searching_file = File.file?(path)
         files.each do |file|
           next unless File.file?(file)
+          next if !searching_file && ignore.ignored?(file, path)
+          # F2: in a DIRECTORY search, never read a secret file's lines into
+          # results (an include-glob like `*.env` would otherwise leak it). A
+          # single-file grep the model targeted directly is already approved
+          # upstream, so it is searched normally.
+          next if !searching_file && secret_path_category(file)
           next if binary_file?(file)
           begin

data/lib/rubino/tools/multi_edit_tool.rb CHANGED Viewed

@@ -57,7 +57,11 @@ module Rubino
         return "Error: file_path is required" if file_path.nil? || file_path.to_s.empty?
         return "Error: edits must be a non-empty array" if !edits.is_a?(Array) || edits.empty?
-        expanded = File.expand_path(file_path)
+        expanded = expand_workspace_path(file_path)
+        # SECRET/credential edits (#446) are no longer HARD-refused here — they
+        # are gated UPSTREAM by Security::ApprovalPolicy#decide (→ :ask): an
+        # APPROVED multi_edit of your .env actually applies, a denied/headless
+        # one never reaches #call. The workspace sandbox below is unchanged.
         return workspace_violation_message(file_path) unless within_workspace?(expanded)
         return "Error: File not found: #{file_path}" unless File.exist?(expanded)
@@ -65,7 +69,11 @@ module Rubino
           return gate
         end
-        content       = File.read(expanded)
+        # Read RAW bytes (binary) so the read-modify-write preserves every byte
+        # outside the matched spans — a non-UTF-8 byte on an untouched line is
+        # written back verbatim (#326). The model-supplied needles/replacements
+        # are matched and spliced as bytes too (see Base#to_match_bytes).
+        content       = read_for_edit(expanded)
         working       = content.dup
         applied_count = 0
@@ -80,30 +88,77 @@ module Rubino
           replace_all = edit["replace_all"] || edit[:replace_all] || false
           return "Error: edit ##{idx + 1} is missing old_string or new_string" if old_s.nil? || new_s.nil?
+          # Empty needle would match at every char boundary and corrupt the
+          # file under replace_all (#329a) — reject it like a missing string.
+          return "Error: edit ##{idx + 1}: old_string is empty" if old_s.empty?
           return "Error: edit ##{idx + 1}: old_string and new_string are identical" if old_s == new_s
-          unless working.include?(old_s)
+          old_b = to_match_bytes(old_s)
+          new_b = to_match_bytes(new_s)
+          unless working.include?(old_b)
+            # Mental model was wrong — let the model's next read of this path
+            # bypass dedup and fetch fresh bytes for recovery (r5 B3).
+            @read_tracker&.note_edit_failure(expanded)
             return "Error: edit ##{idx + 1}: old_string not found (check whitespace; " \
                    "remember edits see the result of prior edits)"
           end
-          count = working.scan(old_s).size
+          count = working.scan(old_b).size
           if count > 1 && !replace_all
             return "Error: edit ##{idx + 1}: #{count} matches for old_string. " \
                    "Add surrounding context to disambiguate, or set replace_all: true."
           end
           working = if replace_all
-                      working.gsub(old_s) { new_s }
+                      working.gsub(old_b) { new_b }
                     else
-                      working.sub(old_s) { new_s }
+                      working.sub(old_b) { new_b }
                     end
           applied_count += replace_all ? count : 1
         end
-        File.write(expanded, working)
-        "Applied #{edits.size} edit(s), #{applied_count} replacement(s) in #{file_path}"
+        # Crash-safe write: temp-in-same-dir + fsync + atomic rename. The tool's
+        # description advertises "atomically" — make it true on the disk seam too,
+        # so a SIGINT/crash mid-flush leaves the ORIGINAL file intact (HIGH-1).
+        Util::AtomicFile.write_atomic(expanded, working)
+        # Refresh-on-own-write so a follow-up edit to this file isn't refused
+        # as "changed on disk since last read" (r5 B2).
+        @read_tracker&.note_write(expanded, working)
+        { output: "Applied #{edits.size} edit(s), #{applied_count} replacement(s) in #{file_path}",
+          metrics: "#{edits.size} edit#{"s" if edits.size != 1} · " \
+                   "#{applied_count} replacement#{"s" if applied_count != 1}",
+          body: build_diff_preview(edits),
+          body_kind: :diff }
       rescue StandardError => e
-        "Error: #{e.message}"
+        # Uniform with WriteTool/EditTool: a read-only target (Errno::EACCES)
+        # or any other filesystem error returns a clean message.
+        "Error editing #{file_path}: #{e.message}"
+      end
+      # Inline diff for the applied result, mirroring EditTool: per edit, the
+      # old lines as `-` then the new lines as `+`, edits separated by a blank
+      # line. Trimmed to the first MAX_DIFF_LINES so a big batch stays a
+      # preview (the edits all still apply).
+      MAX_DIFF_LINES = 16
+      private
+      def build_diff_preview(edits)
+        lines = []
+        edits.each_with_index do |edit, idx|
+          old_s = edit["old_string"] || edit[:old_string]
+          new_s = edit["new_string"] || edit[:new_string]
+          lines << "" unless idx.zero?
+          lines.concat(old_s.to_s.lines.map { |l| "- #{l.chomp}" })
+          lines.concat(new_s.to_s.lines.map { |l| "+ #{l.chomp}" })
+        end
+        if lines.size > MAX_DIFF_LINES
+          dropped = lines.size - MAX_DIFF_LINES
+          lines   = lines.first(MAX_DIFF_LINES)
+          lines << "  [… #{dropped} more line(s)]"
+        end
+        lines.join("\n")
       end
     end
   end

data/lib/rubino/tools/patch_tool.rb CHANGED Viewed

@@ -66,6 +66,11 @@ module Rubino
         hunks.each do |hunk|
           file_path = File.expand_path(hunk[:file], base_path)
+          # SECRET/credential patches (#446) are no longer HARD-refused here —
+          # they are gated UPSTREAM by Security::ApprovalPolicy#decide, which
+          # scans the patch's target paths and prompts (→ :ask) when ANY hunk
+          # touches a secret; an approved apply_patch proceeds, a denied/headless
+          # one never reaches #call. The workspace sandbox below is unchanged.
           unless within_workspace?(file_path)
             return [nil, workspace_violation_message(hunk[:file]) +
                          " (no changes applied — apply_patch is two-phase)"]

data/lib/rubino/tools/read_attachment_tool.rb CHANGED Viewed

@@ -93,7 +93,9 @@ module Rubino
                  "reads documents and text. Inspect other kinds via the shell."
         end
-        markdown = Rubino::Documents.to_markdown(cls.path, mime: cls.mime)
+        # Thread the cancel_token so a runaway/bomb conversion is interruptible
+        # mid-flight and bounded by the converter's wall-clock/element caps.
+        markdown = Rubino::Documents.to_markdown(cls.path, mime: cls.mime, cancel_token: @cancel_token)
         # No in-process converter (unknown format / optional gem absent): degrade
         # with the actionable shell-extraction hint, exactly like the preamble.
         # NEVER raise -- a missing gem must not break the turn.

data/lib/rubino/tools/read_tool.rb CHANGED Viewed

@@ -1,5 +1,7 @@
 # frozen_string_literal: true
+require "digest"
 module Rubino
   module Tools
     # Reads a file with `cat -n` style line numbers, offset/limit windowing,
@@ -49,7 +51,12 @@ module Rubino
         return "Error: file_path is required" if file_path.nil? || file_path.to_s.empty?
-        expanded = File.expand_path(file_path)
+        expanded = expand_workspace_path(file_path)
+        # Reads are BROAD (#406): like Hermes/Claude/Codex, read resolves any
+        # NON-secret path with no prompt (clone-and-inspect). A SECRET/credential
+        # path (#446) is NOT refused here anymore — it is gated UPSTREAM by
+        # Security::ApprovalPolicy#decide (→ :ask), so an APPROVED read returns
+        # the real bytes while a denied/headless read never reaches #call.
         return "Error: File not found: #{file_path}" unless File.exist?(expanded)
         return "Error: Not a regular file: #{file_path}" unless File.file?(expanded)
@@ -64,20 +71,21 @@ module Rubino
         offset = 1 if offset < 1
         limit  = DEFAULT_LIMIT if limit <= 0
-        # Stash mtime BEFORE rendering so a slow render on a huge file doesn't
-        # race with a concurrent writer — we want the mtime the model "saw",
-        # not the one at end-of-render.
-        mtime = File.mtime(expanded)
-        @read_tracker&.register(expanded, mtime)
-        # Re-reading the exact same window (same file, offset, limit, unchanged
-        # mtime) within a turn just re-injects bytes already in context. Return
-        # a short nudge instead so the conversation doesn't carry the same
-        # content twice. A real edit bumps mtime, so legitimate re-reads pass.
-        dup = @read_tracker&.register_window(expanded, offset, limit, mtime)
-        if dup && dup > 1
+        # Stash mtime + content hash BEFORE rendering so a slow render on a huge
+        # file doesn't race with a concurrent writer — we want the state the
+        # model "saw", not the one at end-of-render. The hash is the single
+        # source of truth the edit-gate and dedup both consult.
+        mtime  = File.mtime(expanded)
+        digest = Digest::SHA256.hexdigest(File.binread(expanded))
+        @read_tracker&.register(expanded, mtime, digest)
+        # Re-reading the exact same window of UNCHANGED bytes just re-injects
+        # content already in context. Skip the work with a nudge — but only when
+        # the file still hashes the same, the TTL holds, and no edit-failure
+        # recovery is pending (those serve fresh content). See ReadTracker.
+        if @read_tracker&.duplicate_read?(expanded, offset, limit, digest)
           return { output: "[DUPLICATE READ] Exact repeat of an earlier read of #{file_path} " \
-                           "(lines #{offset}-#{offset + limit - 1}) this turn — reuse that result " \
+                           "(lines #{offset}-#{offset + limit - 1}) — reuse that result " \
                            "instead of re-reading.",
                    metrics: "duplicate" }
         end
@@ -161,12 +169,22 @@ module Rubino
         last_shown  = offset - 1
         byte_capped = false
-        File.open(expanded, "r") do |io|
+        # Open as UTF-8 regardless of the process locale (#273): under a bare
+        # C/POSIX locale the default external encoding is US-ASCII, which would
+        # tag every line ASCII and force the scrub below to mangle perfectly
+        # valid UTF-8 file content. Pinning UTF-8 reads it correctly.
+        File.open(expanded, "r:UTF-8") do |io|
           io.each_line do |line|
             total_lines += 1
             next if total_lines < offset
             break if total_lines > last_line
+            # A single non-UTF-8 byte (e.g. a Latin-1 `é` in a legacy/EU
+            # source comment) would otherwise blow up `chomp`/`format` with
+            # "invalid byte sequence in UTF-8". Scrub it to the replacement
+            # char so the model can still read (and then edit) the file —
+            # lossy but graceful, instead of a blind read failure.
+            line = line.scrub unless line.valid_encoding?
             chomped = line.chomp
             chomped = chomped.byteslice(0, MAX_LINE_WIDTH) + "… [line truncated]" if chomped.bytesize > MAX_LINE_WIDTH
             out << format("%6d\t%s\n", total_lines, chomped)