RubyGems - rubino-agent - Versions diffs - 0.3.0 → 0.5.0 - Mend

rubino-agent 0.3.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (196) hide show

checksums.yaml +4 -4
data/.rubocop_todo.yml +11 -2
data/AGENTS.md +1 -1
data/CHANGELOG.md +172 -5
data/CONTRIBUTING.md +10 -1
data/README.md +14 -5
data/Rakefile +31 -0
data/docs/agents.md +42 -23
data/docs/architecture.md +2 -2
data/docs/commands.md +35 -3
data/docs/configuration.md +20 -23
data/docs/getting-started.md +5 -3
data/docs/security.md +16 -5
data/docs/skills.md +31 -0
data/docs/troubleshooting.md +1 -1
data/exe/rubino +16 -2
data/install.sh +721 -59
data/lib/rubino/active_agent.rb +73 -0
data/lib/rubino/agent/action_claim_guard.rb +881 -0
data/lib/rubino/agent/agent_registry.rb +5 -2
data/lib/rubino/agent/definition.rb +1 -9
data/lib/rubino/agent/fallback_chain.rb +0 -6
data/lib/rubino/agent/iteration_budget.rb +109 -3
data/lib/rubino/agent/loop.rb +476 -20
data/lib/rubino/agent/model_call_runner.rb +81 -3
data/lib/rubino/agent/prompts/build.txt +22 -5
data/lib/rubino/agent/response_validator.rb +8 -0
data/lib/rubino/agent/runner.rb +133 -8
data/lib/rubino/agent/tool_executor.rb +166 -14
data/lib/rubino/agent/truncation_continuation.rb +4 -1
data/lib/rubino/api/server.rb +19 -0
data/lib/rubino/attachments/classify.rb +35 -17
data/lib/rubino/boot/config_guard.rb +71 -0
data/lib/rubino/cli/chat/completion_builder.rb +42 -6
data/lib/rubino/cli/chat/idle_card_host.rb +7 -1
data/lib/rubino/cli/chat/session_resolver.rb +87 -21
data/lib/rubino/cli/chat_command.rb +1189 -50
data/lib/rubino/cli/commands.rb +282 -2
data/lib/rubino/cli/config_command.rb +68 -8
data/lib/rubino/cli/doctor_command.rb +204 -12
data/lib/rubino/cli/jobs_command.rb +12 -0
data/lib/rubino/cli/memory_command.rb +53 -20
data/lib/rubino/cli/onboarding_wizard.rb +79 -6
data/lib/rubino/cli/session_command.rb +172 -18
data/lib/rubino/cli/setup_command.rb +131 -8
data/lib/rubino/cli/skills_command.rb +183 -9
data/lib/rubino/cli/trust_gate.rb +16 -7
data/lib/rubino/commands/built_ins.rb +2 -0
data/lib/rubino/commands/command.rb +12 -2
data/lib/rubino/commands/executor.rb +149 -12
data/lib/rubino/commands/handlers/agent_switch.rb +100 -0
data/lib/rubino/commands/handlers/agents.rb +156 -41
data/lib/rubino/commands/handlers/config.rb +4 -1
data/lib/rubino/commands/handlers/help.rb +113 -14
data/lib/rubino/commands/handlers/memory.rb +15 -5
data/lib/rubino/commands/handlers/sessions.rb +26 -3
data/lib/rubino/commands/handlers/status.rb +9 -4
data/lib/rubino/commands/loader.rb +12 -0
data/lib/rubino/config/configuration.rb +86 -24
data/lib/rubino/config/defaults.rb +140 -33
data/lib/rubino/config/loader.rb +62 -12
data/lib/rubino/config/validator.rb +341 -0
data/lib/rubino/config/writer.rb +123 -31
data/lib/rubino/context/compressor.rb +184 -22
data/lib/rubino/context/environment_inspector.rb +2 -2
data/lib/rubino/context/file_discovery.rb +2 -2
data/lib/rubino/context/message_boundary.rb +27 -1
data/lib/rubino/context/project_languages.rb +90 -0
data/lib/rubino/context/prompt_assembler.rb +105 -22
data/lib/rubino/context/summary_builder.rb +45 -4
data/lib/rubino/context/token_budget.rb +36 -11
data/lib/rubino/context/token_estimate.rb +45 -0
data/lib/rubino/context/tool_result_pruner.rb +81 -0
data/lib/rubino/database/connection.rb +154 -3
data/lib/rubino/database/migrations/001_create_initial_schema.rb +314 -40
data/lib/rubino/database/migrator.rb +98 -5
data/lib/rubino/documents/cap_exceeded.rb +13 -0
data/lib/rubino/documents/converters/csv.rb +4 -3
data/lib/rubino/documents/converters/docx.rb +29 -5
data/lib/rubino/documents/converters/html.rb +5 -1
data/lib/rubino/documents/converters/json.rb +2 -1
data/lib/rubino/documents/converters/pdf.rb +11 -2
data/lib/rubino/documents/converters/plain.rb +2 -1
data/lib/rubino/documents/converters/pptx.rb +11 -2
data/lib/rubino/documents/converters/xlsx.rb +35 -4
data/lib/rubino/documents/converters/xml.rb +2 -1
data/lib/rubino/documents/limits.rb +210 -0
data/lib/rubino/documents.rb +10 -3
data/lib/rubino/errors.rb +36 -5
data/lib/rubino/interaction/cancel_token.rb +19 -3
data/lib/rubino/interaction/events.rb +13 -0
data/lib/rubino/interaction/lifecycle.rb +99 -13
data/lib/rubino/interaction/polishing.rb +176 -0
data/lib/rubino/jobs/cron_job_repository.rb +5 -8
data/lib/rubino/jobs/handlers/cleanup_sessions_job.rb +11 -0
data/lib/rubino/jobs/handlers/distill_skill_job.rb +65 -9
data/lib/rubino/jobs/queue.rb +63 -8
data/lib/rubino/jobs/runner.rb +24 -6
data/lib/rubino/jobs/worker.rb +0 -4
data/lib/rubino/llm/adapter_response.rb +47 -4
data/lib/rubino/llm/credential_check.rb +15 -16
data/lib/rubino/llm/error_classifier.rb +89 -1
data/lib/rubino/llm/inline_think_filter.rb +69 -12
data/lib/rubino/llm/request.rb +30 -3
data/lib/rubino/llm/ruby_llm_adapter.rb +394 -46
data/lib/rubino/llm/tool_bridge.rb +113 -9
data/lib/rubino/mcp/manager.rb +18 -1
data/lib/rubino/mcp/mcp_tool_wrapper.rb +14 -3
data/lib/rubino/memory/aux_retry.rb +107 -0
data/lib/rubino/memory/backends/sqlite.rb +73 -44
data/lib/rubino/memory/backends.rb +23 -7
data/lib/rubino/memory/salience_gate.rb +103 -0
data/lib/rubino/memory/sqlite_extraction.rb +70 -0
data/lib/rubino/memory/sqlite_extraction_prompt.rb +11 -0
data/lib/rubino/memory/store.rb +33 -5
data/lib/rubino/memory/threat_scanner.rb +52 -0
data/lib/rubino/output/cost.rb +52 -0
data/lib/rubino/output/headless_block_latch.rb +53 -0
data/lib/rubino/output/result_serializer.rb +222 -0
data/lib/rubino/output/turn_recorder.rb +77 -0
data/lib/rubino/security/approval_policy.rb +227 -32
data/lib/rubino/security/command_allowlist.rb +79 -4
data/lib/rubino/security/doom_loop_detector.rb +21 -2
data/lib/rubino/security/hardline_guard.rb +189 -16
data/lib/rubino/security/pattern_matcher.rb +28 -5
data/lib/rubino/security/prefix_deriver.rb +25 -6
data/lib/rubino/security/readonly_commands.rb +145 -5
data/lib/rubino/security/secret_path.rb +134 -0
data/lib/rubino/security/url_safety.rb +255 -0
data/lib/rubino/session/repository.rb +212 -11
data/lib/rubino/session/store.rb +139 -14
data/lib/rubino/skills/installer.rb +230 -0
data/lib/rubino/skills/prompt_index.rb +2 -2
data/lib/rubino/skills/registry.rb +52 -1
data/lib/rubino/skills/skill.rb +64 -3
data/lib/rubino/skills/skill_tool.rb +16 -5
data/lib/rubino/tools/background_tasks.rb +157 -13
data/lib/rubino/tools/base.rb +204 -3
data/lib/rubino/tools/edit_tool.rb +73 -18
data/lib/rubino/tools/glob_tool.rb +48 -9
data/lib/rubino/tools/grep_tool.rb +103 -9
data/lib/rubino/tools/multi_edit_tool.rb +64 -9
data/lib/rubino/tools/patch_tool.rb +5 -0
data/lib/rubino/tools/read_attachment_tool.rb +3 -1
data/lib/rubino/tools/read_tool.rb +33 -15
data/lib/rubino/tools/read_tracker.rb +153 -35
data/lib/rubino/tools/registry.rb +113 -12
data/lib/rubino/tools/result.rb +9 -1
data/lib/rubino/tools/ruby_tool.rb +0 -0
data/lib/rubino/tools/shell_registry.rb +70 -0
data/lib/rubino/tools/shell_tool.rb +40 -1
data/lib/rubino/tools/summarize_file_tool.rb +6 -0
data/lib/rubino/tools/task_stop_tool.rb +10 -16
data/lib/rubino/tools/task_tool.rb +36 -8
data/lib/rubino/tools/vision_tool.rb +5 -0
data/lib/rubino/tools/webfetch_tool.rb +39 -7
data/lib/rubino/tools/websearch_tool.rb +92 -30
data/lib/rubino/tools/write_tool.rb +23 -4
data/lib/rubino/ui/api.rb +10 -1
data/lib/rubino/ui/base.rb +11 -0
data/lib/rubino/ui/bottom_composer.rb +382 -74
data/lib/rubino/ui/cli.rb +515 -83
data/lib/rubino/ui/completion_menu.rb +11 -7
data/lib/rubino/ui/headless_trace.rb +63 -0
data/lib/rubino/ui/live_region.rb +70 -7
data/lib/rubino/ui/markdown_renderer.rb +142 -7
data/lib/rubino/ui/notifier.rb +0 -2
data/lib/rubino/ui/null.rb +52 -5
data/lib/rubino/ui/paste_store.rb +16 -2
data/lib/rubino/ui/queued_indicators.rb +6 -1
data/lib/rubino/ui/status_bar.rb +61 -7
data/lib/rubino/ui/streaming_markdown.rb +59 -6
data/lib/rubino/ui/subagent_view.rb +29 -4
data/lib/rubino/ui/tool_label.rb +52 -0
data/lib/rubino/update_check.rb +39 -4
data/lib/rubino/util/atomic_file.rb +117 -0
data/lib/rubino/util/ignore_rules.rb +120 -0
data/lib/rubino/util/output.rb +229 -12
data/lib/rubino/util/secrets_mask.rb +70 -7
data/lib/rubino/util/spill_store.rb +153 -0
data/lib/rubino/version.rb +1 -1
data/lib/rubino/workspace.rb +9 -1
data/lib/rubino.rb +191 -7
data/rubino-agent.gemspec +1 -0
data/skills/ruby-expert/SKILL.md +1 -0
metadata +42 -12
data/lib/rubino/agent/router.rb +0 -65
data/lib/rubino/database/migrations/002_create_runs.rb +0 -45
data/lib/rubino/database/migrations/003_create_skill_states.rb +0 -15
data/lib/rubino/database/migrations/004_create_cron_jobs.rb +0 -36
data/lib/rubino/database/migrations/005_create_oauth_connections.rb +0 -27
data/lib/rubino/database/migrations/006_create_webhook_deliveries.rb +0 -34
data/lib/rubino/database/migrations/007_create_messages_fts.rb +0 -59
data/lib/rubino/database/migrations/008_create_memory_facts.rb +0 -75
data/lib/rubino/database/migrations/009_create_memory_graph.rb +0 -55
data/lib/rubino/database/migrations/010_add_owner_pid_to_sessions.rb +0 -20

data/lib/rubino/security/approval_policy.rb CHANGED Viewed

@@ -16,6 +16,20 @@ module Rubino
     class ApprovalPolicy
       MODES = %w[manual auto skip].freeze
+      # Structured in-workspace file-edit tools. Under dangerous_only these run
+      # unprompted — SYMMETRIC with safe shell — because the always-on #413
+      # write-denylist + workspace sandbox (both enforced inside the tool's
+      # #call, regardless of approval) are the boundary, not a per-edit prompt
+      # (#427, mirrors Hermes file_safety + Claude Code acceptEdits / Codex
+      # auto-edit / aider).
+      STRUCTURED_EDIT_TOOLS = %w[edit write multi_edit apply_patch].freeze
+      # File tools whose TARGET path is run through the unified secret-file gate
+      # (#446). READ side resolves the path from `file_path`/`path`; WRITE side
+      # from `file_path` (apply_patch from its patch text, see #secret_file_access?).
+      SECRET_GATED_READ_TOOLS  = %w[read grep glob].freeze
+      SECRET_GATED_WRITE_TOOLS = STRUCTURED_EDIT_TOOLS
       # Why the most recent #decide returned :deny — :hardline (the
       # non-bypassable floor), :permission_rule (an explicit permissions deny
       # rule), or :doom_loop (the repeated-identical-call guard). nil when the
@@ -27,18 +41,34 @@ module Rubino
       def initialize(config: nil, agent_overrides: nil)
         @config = config || Rubino.configuration
         @mode = @config.approvals_mode
-        # Effective shell prompt policy (:confirm_all | :dangerous_only).
-        # Derived from security.confirm_policy, with security.require_confirmation_for_shell
-        # as a back-compat alias (see Configuration#confirm_policy). Older config
-        # objects that predate the accessor fall back to :confirm_all.
+        # Effective shell prompt policy (:confirm_all | :dangerous_only), the
+        # SOLE source of truth (item 7): security.confirm_policy only — the legacy
+        # security.require_confirmation_for_shell alias was removed (see
+        # Configuration#confirm_policy). Older config objects that predate the
+        # accessor fall back to the reference-faithful :dangerous_only default.
         @confirm_policy =
-          @config.respond_to?(:confirm_policy) ? @config.confirm_policy : :confirm_all
+          @config.respond_to?(:confirm_policy) ? @config.confirm_policy : :dangerous_only
         @pattern_matcher = PatternMatcher.new(
           rules: load_permission_rules(agent_overrides)
         )
-        @doom_detector = DoomLoopDetector.new
+        # Doom-loop guard, config-driven (#414). Default WARN-not-block with a
+        # higher threshold (Hermes tool_guardrails alignment): a tripped detector
+        # under hard_stop:false surfaces a warning but lets the call run.
+        @doom_detector = DoomLoopDetector.new(
+          threshold: @config.respond_to?(:doom_loop_threshold) ? @config.doom_loop_threshold : DoomLoopDetector::DEFAULT_THRESHOLD,
+          hard_stop: @config.respond_to?(:doom_loop_hard_stop?) ? @config.doom_loop_hard_stop? : false
+        )
+        # Set true after a warn-mode doom-loop hit so ToolExecutor can surface a
+        # one-time warning to the model without denying the call. Cleared each
+        # #decide and on reset_turn!.
+        @doom_loop_warning = false
       end
+      # True when the LAST #decide tripped the doom-loop guard in WARN mode
+      # (hard_stop off): the call was allowed but the model should be told it is
+      # repeating an identical call. ToolExecutor reads this to attach a warning.
+      attr_reader :doom_loop_warning
       # Returns the decision for a tool call: :allow, :ask, :deny
       #
       # CANONICAL DECISION ORDER (deny-class checks precede every allow path).
@@ -46,14 +76,22 @@ module Rubino
       #
       #   1. hardline(:deny)            non-bypassable floor BELOW yolo
       #   2. permissions:deny           an explicit deny rule also beats yolo
-      #   3. yolo / skip-approvals      allow-exit (doom still guards it)
+      #   3. runtime yolo (Modes)      allow-exit (doom still guards it).
+      #                                 config approvals.mode: "skip" does NOT
+      #                                 take this exit — it is not a headless
+      #                                 yolo (see steps 7-9 / #260).
       #   4. doom loop                  break a stuck autopilot
       #   5. permissions:allow / :ask   remaining explicit rules
-      #   6. command_allowlist (prefix) pre-approved commands -> :allow
+      #   6. command_allowlist          pre-approved EXACT commands -> :allow
+      #                                 (chain-aware, token-boundary; never a
+      #                                 prefix of a compound line)
       #   6b. readonly auto-allow       parse-validated read-only shell -> :allow
       #   7-8. confirm_policy shell gate  confirm_all -> :ask; dangerous_only
-      #                                 -> :ask only if dangerous?, else :allow
-      #   9. mode fallback
+      #                                 -> :ask only if dangerous?, else :allow.
+      #                                 Runs for mode "skip" too, so a write/
+      #                                 shell under config "skip" still reaches
+      #                                 the headless fail-closed floor (#260).
+      #   9. mode fallback             ("skip" -> :ask for risky tools, not :allow)
       #
       # The invariant that makes this slice worth doing: HARDLINE and an
       # explicit permissions:deny BOTH run before any allow path (yolo,
@@ -61,6 +99,7 @@ module Rubino
       # by a fast-path the way yolo used to override deny rules.
       def decide(tool, arguments: {})
         @last_deny_reason = nil
+        @doom_loop_warning = false
         command_str = self.class.command_string(tool, arguments)
         # 1. Hardline floor — a floor BELOW yolo. Catastrophic, unrecoverable
@@ -87,20 +126,36 @@ module Rubino
         #    run the doom detector AFTER, because an autopilot stuck in a loop
         #    is the one thing yolo isn't supposed to license.
         if Rubino::Modes.skip_approvals?
-          return deny_with(:doom_loop) if @doom_detector.record(tool_name: tool.name, arguments: arguments)
+          return deny_with(:doom_loop) if doom_loop_blocks?(tool, arguments)
           return :allow
         end
-        # 4. Doom loop guard.
-        if @doom_detector.record(tool_name: tool.name, arguments: arguments)
-          return deny_with(:doom_loop) # Break the loop
-        end
+        # 4. Doom loop guard. Blocks only under hard_stop (#414); in the default
+        #    warn mode it sets @doom_loop_warning and falls through to the normal
+        #    decision so a legitimate repeated call is not hard-denied.
+        return deny_with(:doom_loop) if doom_loop_blocks?(tool, arguments)
         # 5. Remaining explicit pattern rules (allow / ask). deny was already
-        #    handled in step 2.
+        #    handled in step 2. An explicit user permissions rule (allow/ask)
+        #    wins over the secret gate below, so a user who wrote
+        #    `read /path/.env: allow` is honored.
         return pattern_result if pattern_result
+        # 5b. UNIFIED SECRET-FILE GATE (#446). Reading (read/grep/glob) OR
+        #     writing/editing (write/edit/multi_edit/apply_patch) a SECRET path
+        #     requires EXPLICIT user approval — the maintainer decision: not a
+        #     silent allow, not a silent hard-block. Returns :ask, which the
+        #     ToolExecutor turns into the approval dropdown when interactive
+        #     (approved → the tool runs and reads/writes the secret; denied →
+        #     refused) and into a FAIL-CLOSED block when headless (:noninteractive).
+        #     Runs ABOVE the broad read/allow fast-paths (steps 6/6b/9) so a
+        #     secret read isn't silently auto-allowed, and BELOW yolo (step 3) so
+        #     a --yolo operator who opted into full file trust isn't re-prompted.
+        #     NON-secret reads stay broad (clone-and-inspect, #406) — only the
+        #     secret set is gated.
+        return :ask if secret_file_access?(tool, arguments)
         # 6. Config allowlist of pre-approved commands. Checked AFTER deny
         #    patterns (deny always wins) but BEFORE mode-based decision so a
         #    listed command never triggers a manual prompt.
@@ -114,32 +169,70 @@ module Rubino
         #    validator cannot prove read-only falls through to the prompt.
         return :allow if readonly_auto_allowed?(tool, command_str)
+        # 6c. skill(action: "create") WRITES <RUBINO_HOME>/skills/<name>/SKILL.md
+        #    and must not be a silent low-risk allow (#405): the skill tool stays
+        #    :low so a read_only agent keeps `skill load/list/show`, but the
+        #    create action is a write and routes to :ask here — like any write.
+        #    Below yolo (step 3), so a full-access --yolo agent still creates
+        #    skills inline; a headless read_only subagent's :ask becomes the
+        #    fail-closed block, closing the unapproved-write path. load is never
+        #    gated (only the create action matches).
+        #
+        #    This gate is now a real boundary, not theater (SK-2): authored
+        #    skills are written under the agent HOME (outside the cwd workspace),
+        #    so the model can't sidestep it by emitting a plain `write` of the
+        #    same SKILL.md — the workspace sandbox (within_workspace?) refuses any
+        #    write outside the workspace, leaving this :ask-gated helper as the
+        #    ONLY way to author a skill.
+        return :ask if skill_create?(tool, arguments)
         # 7-8. confirm_policy gate for a shell command not otherwise resolved.
-        #    NOT under config "skip" (nor runtime yolo, handled at step 3) —
-        #    those are the explicit operator overrides that mean "stop
-        #    prompting me".
+        #    NOT under runtime yolo (handled at step 3) — that is the explicit
+        #    CLI operator override that means "stop prompting me".
         #
-        #    confirm_all (DEFAULT, == legacy require_confirmation_for_shell:true)
+        #    config approvals.mode: "skip" is NOT given the same allow-exit as
+        #    runtime yolo here. #260 deliberately made the headless skip a
+        #    CLI-only opt-in (--yolo): a config-file "skip" must NOT silently
+        #    auto-run write/shell in a headless session. So a not-otherwise-
+        #    resolved shell command still routes through this gate to :ask, and
+        #    the ToolExecutor's headless fail-closed floor (#260) turns that
+        #    :ask into a block when there is no interactive session. Interactive
+        #    sessions still get a prompt — same as auto/manual. (Reads are
+        #    already auto-allowed by step 6b / mode_based_decision, so this
+        #    only constrains the write/shell side.)
+        #
+        #    confirm_all (opt-in hardening)
         #      every such shell command -> :ask. shell is :high risk so manual
         #      mode would ask anyway; this also keeps it gated under auto mode.
         #
-        #    dangerous_only (reference-faithful, == legacy alias:false)
+        #    dangerous_only (DEFAULT, reference-faithful)
         #      prompt ONLY when the command matches a DangerousPattern
         #      (git push --force, curl|sh, recursive rm of a non-root path,
         #      ...). Safe commands run unprompted. Mirrors approval.py:475
         #      where detect_dangerous_command is the sole prompt trigger.
         #      The hardline floor (step 1) and permissions:deny (step 2) already
         #      ran, so dangerous_only NEVER weakens the non-bypassable floor.
-        if tool.name == "shell" && @mode != "skip"
-          case @confirm_policy
-          when :dangerous_only
-            return :ask if dangerous?(command_str)
-            return :allow
-          else # :confirm_all
-            return :ask
-          end
-        end
+        return shell_confirm_decision(command_str) if tool.name == "shell"
+        # 8b. Structured in-workspace edit symmetry (#427). Under dangerous_only,
+        #    a safe `shell sed -i …` / `echo > file` runs UNPROMPTED (step 7-8),
+        #    but the structured edit/write/multi_edit/apply_patch tools are
+        #    :medium and would fall through to step 9 -> :ask, which fails closed
+        #    headless. That asymmetry pushes automation AWAY from the clean,
+        #    read-tracked, diff-producing structured tools and TOWARD raw shell
+        #    mutation — worse for safety/observability and the inverse of the
+        #    industry norm (Hermes runs structured in-workspace edits unprompted
+        #    with file_safety.is_write_denied as the boundary; Claude Code
+        #    acceptEdits, Codex auto-edit and aider all treat in-workspace edits
+        #    as LOWER friction than shell). So under dangerous_only these
+        #    structured edits are non-prompting too — SYMMETRIC with safe shell.
+        #    This NEVER widens reach: the always-on #413 write-denylist (refuses
+        #    .env/.ssh/.aws/etc even inside the workspace) and the workspace
+        #    sandbox both run inside the tool's #call regardless of approval, and
+        #    the hardline floor (step 1), permissions:deny (step 2) and
+        #    skill-create gate (step 6c) all already ran above. confirm_all
+        #    (non-default) still routes them through step 9 -> :ask unchanged.
+        return :allow if @confirm_policy == :dangerous_only && STRUCTURED_EDIT_TOOLS.include?(tool.name)
         # 9. Fall back to mode-based decision
         mode_based_decision(tool)
@@ -159,6 +252,78 @@ module Rubino
         CommandAllowlist.new(config: @config).allowed?(command)
       end
+      # True when this is the WRITE action of the skill tool (action: "create").
+      # The skill tool is :low (so read_only keeps load/list/show), but its
+      # create action writes a SKILL.md and must be approval-gated (#405).
+      def skill_create?(tool, arguments)
+        return false unless tool.name == "skill"
+        args = arguments || {}
+        (args["action"] || args[:action]).to_s == "create"
+      end
+      # The confirm_policy shell gate (steps 7-8), extracted so #decide stays
+      # under the complexity limit. confirm_all → always :ask; dangerous_only →
+      # :ask only for a DangerousPattern, else :allow.
+      def shell_confirm_decision(command_str)
+        return :ask unless @confirm_policy == :dangerous_only
+        dangerous?(command_str) ? :ask : :allow
+      end
+      # True when this call READS or WRITES a secret/credential path and so must
+      # be approval-gated (#446). For the path-arg tools (read/grep/glob/write/
+      # edit/multi_edit) the single target is resolved from file_path/path; for
+      # apply_patch every target file in the patch is checked, because one call
+      # can touch many files. Resolution is relative to the workspace primary
+      # root so a relative `.env` resolves to the same file the tool will open.
+      def secret_file_access?(tool, arguments)
+        return false unless SECRET_GATED_READ_TOOLS.include?(tool.name) ||
+                            SECRET_GATED_WRITE_TOOLS.include?(tool.name)
+        secret_targets(tool, arguments).any? { |p| SecretPath.secret?(p) }
+      end
+      # The absolute path(s) a file tool will touch. apply_patch yields one per
+      # hunk target; every other gated tool yields its single file_path/path.
+      def secret_targets(tool, arguments)
+        args = arguments || {}
+        if tool.name == "apply_patch"
+          base = (args["base_path"] || args[:base_path]).to_s
+          base = Tools::Base.workspace_root if base.empty?
+          return patch_target_paths(args["patch"] || args[:patch], base)
+        end
+        raw = self.class.command_string(tool, arguments)
+        return [] if raw.to_s.empty?
+        [resolve_workspace_path(raw)]
+      end
+      # Extracts every destination file from a unified diff (`+++ b/<file>`, and
+      # `--- a/<file>` so a delete of a secret is gated too), absolutised against
+      # base_path. A `/dev/null` side carries no file and is skipped.
+      def patch_target_paths(patch, base_path)
+        return [] if patch.nil?
+        patch.to_s.each_line.filter_map do |line|
+          m = line.match(%r{^[-+]{3} [ab]/(.+)\s*$})
+          next if m.nil?
+          File.expand_path(m[1].strip, base_path)
+        end.uniq
+      end
+      # Anchors a relative path at the workspace primary root (matching
+      # Tools::Base#expand_workspace_path) so the gate sees the same target the
+      # tool will. Absolute/~ paths pass through.
+      def resolve_workspace_path(path)
+        str = path.to_s
+        return File.expand_path(str) if str.start_with?(File::SEPARATOR, "~")
+        File.expand_path(str, Tools::Base.workspace_root)
+      end
       # True when the shell command is provably read-only and the
       # approvals.auto_allow_readonly gate (default ON) is open. Shell-only:
       # for every other tool the "command" is a path or argument fragment.
@@ -180,8 +345,18 @@ module Rubino
           (args["command"] || args[:command]).to_s
         when "read", "write", "edit", "multi_edit", "attach_file"
           (args["file_path"] || args[:file_path]).to_s
+        when "grep", "glob"
+          # The SEARCH ROOT (a dir or a file) is what the secret gate resolves —
+          # `pattern` is the regex/glob, not a path. (Default "." like the tools.)
+          (args["path"] || args[:path] || ".").to_s
         when "shell_output", "shell_kill", "shell_input"
           (args["run_id"] || args[:run_id]).to_s
+        when "skill"
+          # "<action> <name>" so the approval scope distinguishes a create from
+          # a load and one skill name from another (granularity parity, #405).
+          action = args["action"] || args[:action] || "load"
+          name   = args["name"] || args[:name]
+          [action, name].join(" ").strip
         else
           args.values.first.to_s
         end
@@ -194,6 +369,21 @@ module Rubino
       private
+      # Records the tool call in the doom detector and returns true ONLY when it
+      # tripped AND the guard is in hard_stop mode (=> block). In the default
+      # warn mode a trip sets @doom_loop_warning and returns false, so the call
+      # proceeds through the normal decision path (#414).
+      def doom_loop_blocks?(tool, arguments)
+        return false unless @doom_detector.record(tool_name: tool.name, arguments: arguments)
+        if @doom_detector.hard_stop?
+          true
+        else
+          @doom_loop_warning = true
+          false
+        end
+      end
       # Records WHY this deny fired before returning it (see #last_deny_reason).
       def deny_with(reason)
         @last_deny_reason = reason
@@ -202,8 +392,13 @@ module Rubino
       def mode_based_decision(tool)
         case @mode
+        # config approvals.mode: "skip" is NOT a headless yolo (#260). It stays
+        # permissive for non-risky tools (reads), but a risky tool (write/edit/
+        # shell) routes to :ask so the headless fail-closed floor can block it
+        # when there is no interactive session — only runtime --yolo (step 3)
+        # may auto-run those headless. Interactive sessions still get a prompt.
         when "skip"
-          :allow
+          tool.risky? ? :ask : :allow
         when "auto"
           tool.risk_level == :high ? :ask : :allow
         when "manual"

data/lib/rubino/security/command_allowlist.rb CHANGED Viewed

@@ -1,24 +1,99 @@
 # frozen_string_literal: true
+require "shellwords"
 module Rubino
   module Security
-    # Manages a whitelist of shell commands that can be executed without confirmation.
+    # Manages a whitelist of shell commands that can be executed without
+    # confirmation.
+    #
+    # An allowlist entry pre-approves an EXACT single command, never a prefix
+    # of a larger compound line. A naive `start_with?` (the old behaviour) let
+    # any line whose head matched an entry auto-resolve to :allow — INCLUDING
+    # the chained tail: with `git status` allowlisted,
+    # `git status; echo k >> ~/.ssh/authorized_keys` resolved to :allow,
+    # turning a read-only pre-approval into headless RCE/exfil. So this matcher
+    # is chain-aware, mirroring ReadonlyCommands:
+    #
+    #   - DangerousPatterns runs FIRST on the whole line, so a dangerous tail
+    #     (curl|sh, recursive rm, write into ~/.ssh, ...) can never be beaten
+    #     by an allowlisted head;
+    #   - the line is split into chain segments (|, ||, &&, ;, newline) with the
+    #     same quote-aware splitter as ReadonlyCommands, which REJECTS the line
+    #     outright on redirection (>), backgrounding (&), command substitution
+    #     ($(...) / backticks) or process substitution (<(...) / >()) — the
+    #     constructs that smuggle a write or an execution past a head check;
+    #   - EVERY segment must match an allowlist entry, and a match is on a TOKEN
+    #     boundary (a prefix of whole tokens), never a bare substring: `git`
+    #     allowlisted does NOT pre-approve `git-secret-leak`, and `git status`
+    #     does NOT pre-approve `git statusxyz`;
+    #   - a matched head is FLAG-VETTED via ReadonlyCommands: an allowlisted
+    #     read-capable head can not smuggle a write/exec flag past the prefix
+    #     match. With `git diff` allowlisted, `git diff --output /tmp/PWN`
+    #     (an arbitrary write) is REJECTED — same for `git diff -O...`,
+    #     `find -exec/-delete/-fprintf`, `date -s`, `tree -o` (SEC-1).
     class CommandAllowlist
       def initialize(config: nil)
         @config = config || Rubino.configuration
         @allowlist = @config.security_command_allowlist
       end
-      # Returns true if the command matches an entry in the allowlist.
+      # Returns true ONLY when the ENTIRE command line is covered by the
+      # allowlist: not dangerous, splits cleanly into chain segments, and every
+      # segment's head matches an allowlist entry on a token boundary.
+      #
       # An EMPTY allowlist matches NOTHING — pre-approval is opt-in, so an
       # unconfigured allowlist must never auto-approve everything.
       def allowed?(command)
         return false if @allowlist.empty?
+        # The whole-line danger check runs before any matching, so an
+        # allowlisted head can never pre-approve a dangerous tail.
+        return false if DangerousPatterns.dangerous?(command)
+        entries = allowlist_token_lists
+        # Every configured entry was blank or untokenizable: nothing can match.
+        return false if entries.empty?
+        segments = ReadonlyCommands.split_segments(command.to_s)
+        # No usable segments (nil or an empty list) => not pre-approved.
+        return false if segments.nil? || segments.empty?
+        # Every segment of the chain must be covered, not just the first one.
+        segments.all? { |segment| segment_allowed?(segment, entries) }
+      end
-        @allowlist.any? do |allowed|
-          command.strip.start_with?(allowed.strip)
+      private
+      # Each allowlist entry as its token list (e.g. "bundle exec rspec" ->
+      # %w[bundle exec rspec]). Empty / blank entries are dropped so a stray ""
+      # in the config can't match every command.
+      def allowlist_token_lists
+        @allowlist.filter_map do |entry|
+          tokens = Shellwords.split(entry.to_s)
+          tokens unless tokens.empty?
+        rescue ArgumentError
+          nil # an entry that won't tokenize (unbalanced quote) can't match
         end
       end
+      # A single chain segment is allowed when its leading tokens exactly match
+      # some allowlist entry's tokens AND it carries no write/exec flag that
+      # would turn a matched read-capable head into an arbitrary write or
+      # execution. Matching on the token list (not the raw string) makes it
+      # boundary-safe: `git status` matches `git status -s` but never
+      # `git statusxyz`.
+      #
+      # Flag vetting reuses ReadonlyCommands' dangerous-flag logic so the
+      # allowlist and the read-only auto-allow agree on what `git --output`,
+      # `find -exec/-delete/-fprintf`, `date -s`, `tree -o` mean: a head being
+      # on the allowlist pre-approves the COMMAND, never a smuggled output/exec
+      # flag (SEC-1 — `git diff --output FILE` arbitrary write).
+      def segment_allowed?(segment, entries)
+        tokens = Shellwords.split(segment)
+        return false if tokens.empty?
+        matched = entries.any? { |entry_tokens| tokens.first(entry_tokens.length) == entry_tokens }
+        return false unless matched
+        !ReadonlyCommands.dangerous_flags?(tokens)
+      rescue ArgumentError
+        false # unbalanced quotes etc. — fall through to the prompt
+      end
     end
   end
 end

data/lib/rubino/security/doom_loop_detector.rb CHANGED Viewed

@@ -4,15 +4,34 @@ module Rubino
   module Security
     # Detects when the agent enters a doom loop - repeatedly calling
     # the same tool with identical arguments without progress.
+    #
+    # Two dimensions, both config-driven (Hermes tool_guardrails alignment,
+    # #414):
+    #   - threshold: how many identical consecutive calls trip detection
+    #     (default 5; Hermes grades 5-8). The old default was 3, which hard-
+    #     denied a legitimate 3rd retry of an idempotent read.
+    #   - hard_stop: when true, a tripped detector means BLOCK (the policy
+    #     returns :deny). When false (the default) it WARNS but allows — the
+    #     policy surfaces a one-time warning to the model and lets the call run.
     class DoomLoopDetector
-      DEFAULT_THRESHOLD = 3
+      DEFAULT_THRESHOLD = 5
-      def initialize(threshold: DEFAULT_THRESHOLD)
+      attr_reader :threshold
+      def initialize(threshold: DEFAULT_THRESHOLD, hard_stop: false)
         @threshold = threshold
+        @hard_stop = hard_stop
         @history = []
       end
+      # True when the detector is configured to BLOCK on detection (vs. warn).
+      # The comparison is strict: only a hard_stop value equal to `true` turns
+      # blocking on; nil or any other value leaves the detector in warn mode.
+      def hard_stop?
+        @hard_stop == true
+      end
       # Records a tool call and returns true if a doom loop is detected
+      # (the last `threshold` calls are identical). Detection is independent
+      # of hard_stop — the caller decides whether a hit blocks or only warns.
       def record(tool_name:, arguments:)
         signature = generate_signature(tool_name, arguments)
         @history << signature