RubyGems - rubino-agent - Versions diffs - 0.3.0 - Mend

rubino-agent 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (376) hide show

checksums.yaml +7 -0
data/.rspec +3 -0
data/.rubocop.yml +115 -0
data/.rubocop_todo.yml +955 -0
data/.ruby-version +1 -0
data/AGENTS.md +97 -0
data/CHANGELOG.md +344 -0
data/CONTRIBUTING.md +69 -0
data/LICENSE +21 -0
data/README.md +200 -0
data/Rakefile +8 -0
data/docs/agents.md +190 -0
data/docs/api/v1.md +414 -0
data/docs/architecture.md +177 -0
data/docs/commands.md +375 -0
data/docs/configuration.md +590 -0
data/docs/getting-started.md +143 -0
data/docs/jobs.md +332 -0
data/docs/mcp.md +128 -0
data/docs/memory.md +98 -0
data/docs/models-and-keys.md +173 -0
data/docs/oauth-providers.md +145 -0
data/docs/plugins.md +195 -0
data/docs/security.md +145 -0
data/docs/skills.md +322 -0
data/docs/tools.md +395 -0
data/docs/troubleshooting.md +73 -0
data/exe/rubino +9 -0
data/install.sh +275 -0
data/lib/rubino/active_skill.rb +50 -0
data/lib/rubino/agent/agent_registry.rb +120 -0
data/lib/rubino/agent/backoff_policy.rb +116 -0
data/lib/rubino/agent/definition.rb +128 -0
data/lib/rubino/agent/degenerate_recovery.rb +271 -0
data/lib/rubino/agent/fallback_chain.rb +194 -0
data/lib/rubino/agent/iteration_budget.rb +50 -0
data/lib/rubino/agent/loop.rb +617 -0
data/lib/rubino/agent/model_call_runner.rb +383 -0
data/lib/rubino/agent/prompts/build.txt +69 -0
data/lib/rubino/agent/prompts/compaction.txt +20 -0
data/lib/rubino/agent/prompts/explore.txt +19 -0
data/lib/rubino/agent/prompts/general.txt +20 -0
data/lib/rubino/agent/prompts/plan.txt +31 -0
data/lib/rubino/agent/response_validator.rb +70 -0
data/lib/rubino/agent/router.rb +65 -0
data/lib/rubino/agent/runner.rb +195 -0
data/lib/rubino/agent/tool_executor.rb +402 -0
data/lib/rubino/agent/truncation_continuation.rb +137 -0
data/lib/rubino/api/middleware/auth.rb +43 -0
data/lib/rubino/api/middleware/error_handler.rb +65 -0
data/lib/rubino/api/middleware/json_parser.rb +100 -0
data/lib/rubino/api/middleware/observability.rb +59 -0
data/lib/rubino/api/middleware/rate_limit.rb +136 -0
data/lib/rubino/api/operations/approvals/decide_operation.rb +49 -0
data/lib/rubino/api/operations/clarifications/decide_operation.rb +44 -0
data/lib/rubino/api/operations/cron_jobs/create_operation.rb +46 -0
data/lib/rubino/api/operations/cron_jobs/delete_operation.rb +36 -0
data/lib/rubino/api/operations/cron_jobs/list_operation.rb +55 -0
data/lib/rubino/api/operations/cron_jobs/pause_operation.rb +34 -0
data/lib/rubino/api/operations/cron_jobs/resume_operation.rb +34 -0
data/lib/rubino/api/operations/cron_jobs/schedule_validation.rb +30 -0
data/lib/rubino/api/operations/cron_jobs/show_operation.rb +32 -0
data/lib/rubino/api/operations/cron_jobs/trigger_operation.rb +38 -0
data/lib/rubino/api/operations/cron_jobs/update_operation.rb +42 -0
data/lib/rubino/api/operations/files/read_operation.rb +40 -0
data/lib/rubino/api/operations/files/upload_operation.rb +175 -0
data/lib/rubino/api/operations/health_operation.rb +46 -0
data/lib/rubino/api/operations/memory/delete_operation.rb +32 -0
data/lib/rubino/api/operations/memory/index_operation.rb +80 -0
data/lib/rubino/api/operations/memory/stats_operation.rb +28 -0
data/lib/rubino/api/operations/metrics_operation.rb +18 -0
data/lib/rubino/api/operations/mode/show_operation.rb +29 -0
data/lib/rubino/api/operations/mode/update_operation.rb +42 -0
data/lib/rubino/api/operations/models/list_operation.rb +45 -0
data/lib/rubino/api/operations/oauth/connections/disconnect_operation.rb +77 -0
data/lib/rubino/api/operations/oauth/connections/list_operation.rb +36 -0
data/lib/rubino/api/operations/oauth/providers/callback_operation.rb +82 -0
data/lib/rubino/api/operations/oauth/providers/connect_operation.rb +44 -0
data/lib/rubino/api/operations/oauth/providers/list_operation.rb +35 -0
data/lib/rubino/api/operations/oauth/serializer.rb +21 -0
data/lib/rubino/api/operations/runs/create_operation.rb +77 -0
data/lib/rubino/api/operations/runs/events_operation.rb +195 -0
data/lib/rubino/api/operations/runs/stop_operation.rb +34 -0
data/lib/rubino/api/operations/sessions/create_operation.rb +46 -0
data/lib/rubino/api/operations/sessions/delete_operation.rb +33 -0
data/lib/rubino/api/operations/sessions/index_operation.rb +82 -0
data/lib/rubino/api/operations/sessions/retry_operation.rb +45 -0
data/lib/rubino/api/operations/sessions/show_operation.rb +59 -0
data/lib/rubino/api/operations/sessions/undo_operation.rb +38 -0
data/lib/rubino/api/operations/skills/list_operation.rb +34 -0
data/lib/rubino/api/operations/skills/toggle_operation.rb +40 -0
data/lib/rubino/api/operations/tasks/index_operation.rb +30 -0
data/lib/rubino/api/operations/tasks/serializer.rb +60 -0
data/lib/rubino/api/operations/tasks/show_operation.rb +33 -0
data/lib/rubino/api/operations/tasks/stop_operation.rb +47 -0
data/lib/rubino/api/request.rb +54 -0
data/lib/rubino/api/responses.rb +64 -0
data/lib/rubino/api/router.rb +72 -0
data/lib/rubino/api/schemas.rb +103 -0
data/lib/rubino/api/server.rb +102 -0
data/lib/rubino/api/tls.rb +108 -0
data/lib/rubino/attachments/classification.rb +16 -0
data/lib/rubino/attachments/classify.rb +171 -0
data/lib/rubino/attachments/defang.rb +47 -0
data/lib/rubino/attachments/policy.rb +36 -0
data/lib/rubino/attachments/preamble.rb +120 -0
data/lib/rubino/boot/encryption_key.rb +32 -0
data/lib/rubino/cli/chat/bang_shell.rb +257 -0
data/lib/rubino/cli/chat/completion_builder.rb +290 -0
data/lib/rubino/cli/chat/idle_card_host.rb +69 -0
data/lib/rubino/cli/chat/image_inbox.rb +168 -0
data/lib/rubino/cli/chat/session_resolver.rb +176 -0
data/lib/rubino/cli/chat_command.rb +1674 -0
data/lib/rubino/cli/commands.rb +250 -0
data/lib/rubino/cli/config_command.rb +96 -0
data/lib/rubino/cli/doctor_command.rb +251 -0
data/lib/rubino/cli/jobs_command.rb +60 -0
data/lib/rubino/cli/memory_command.rb +135 -0
data/lib/rubino/cli/onboarding_wizard.rb +207 -0
data/lib/rubino/cli/server_command.rb +139 -0
data/lib/rubino/cli/session_command.rb +125 -0
data/lib/rubino/cli/setup_command.rb +107 -0
data/lib/rubino/cli/skills_command.rb +85 -0
data/lib/rubino/cli/tools_command.rb +81 -0
data/lib/rubino/cli/trust_gate.rb +71 -0
data/lib/rubino/commands/built_ins.rb +46 -0
data/lib/rubino/commands/command.rb +116 -0
data/lib/rubino/commands/executor.rb +550 -0
data/lib/rubino/commands/handlers/agents.rb +510 -0
data/lib/rubino/commands/handlers/config.rb +88 -0
data/lib/rubino/commands/handlers/help.rb +148 -0
data/lib/rubino/commands/handlers/jobs.rb +71 -0
data/lib/rubino/commands/handlers/mcp.rb +229 -0
data/lib/rubino/commands/handlers/memory.rb +200 -0
data/lib/rubino/commands/handlers/sessions.rb +207 -0
data/lib/rubino/commands/handlers/skills.rb +195 -0
data/lib/rubino/commands/handlers/status.rb +211 -0
data/lib/rubino/commands/loader.rb +90 -0
data/lib/rubino/config/configuration.rb +455 -0
data/lib/rubino/config/defaults.rb +569 -0
data/lib/rubino/config/loader.rb +115 -0
data/lib/rubino/config/reasoning_prefs.rb +67 -0
data/lib/rubino/config/writer.rb +72 -0
data/lib/rubino/context/compressor.rb +149 -0
data/lib/rubino/context/environment_inspector.rb +176 -0
data/lib/rubino/context/file_discovery.rb +45 -0
data/lib/rubino/context/message_boundary.rb +39 -0
data/lib/rubino/context/prompt_assembler.rb +382 -0
data/lib/rubino/context/summary_builder.rb +159 -0
data/lib/rubino/context/token_budget.rb +68 -0
data/lib/rubino/context/tool_pair_sanitizer.rb +70 -0
data/lib/rubino/database/connection.rb +77 -0
data/lib/rubino/database/migrations/001_create_initial_schema.rb +156 -0
data/lib/rubino/database/migrations/002_create_runs.rb +45 -0
data/lib/rubino/database/migrations/003_create_skill_states.rb +15 -0
data/lib/rubino/database/migrations/004_create_cron_jobs.rb +36 -0
data/lib/rubino/database/migrations/005_create_oauth_connections.rb +27 -0
data/lib/rubino/database/migrations/006_create_webhook_deliveries.rb +34 -0
data/lib/rubino/database/migrations/007_create_messages_fts.rb +59 -0
data/lib/rubino/database/migrations/008_create_memory_facts.rb +75 -0
data/lib/rubino/database/migrations/009_create_memory_graph.rb +55 -0
data/lib/rubino/database/migrations/010_add_owner_pid_to_sessions.rb +20 -0
data/lib/rubino/database/migrator.rb +48 -0
data/lib/rubino/documents/converters/csv.rb +79 -0
data/lib/rubino/documents/converters/docx.rb +129 -0
data/lib/rubino/documents/converters/html.rb +28 -0
data/lib/rubino/documents/converters/json.rb +35 -0
data/lib/rubino/documents/converters/pdf.rb +59 -0
data/lib/rubino/documents/converters/plain.rb +68 -0
data/lib/rubino/documents/converters/pptx.rb +64 -0
data/lib/rubino/documents/converters/xlsx.rb +62 -0
data/lib/rubino/documents/converters/xml.rb +45 -0
data/lib/rubino/documents/html.rb +71 -0
data/lib/rubino/documents/registry.rb +68 -0
data/lib/rubino/documents/table.rb +63 -0
data/lib/rubino/documents.rb +50 -0
data/lib/rubino/errors.rb +119 -0
data/lib/rubino/files/workspace.rb +93 -0
data/lib/rubino/interaction/cancel_token.rb +43 -0
data/lib/rubino/interaction/clipboard_image.rb +84 -0
data/lib/rubino/interaction/event_bus.rb +48 -0
data/lib/rubino/interaction/events.rb +101 -0
data/lib/rubino/interaction/image_input.rb +127 -0
data/lib/rubino/interaction/input_queue.rb +117 -0
data/lib/rubino/interaction/lifecycle.rb +299 -0
data/lib/rubino/interaction/probe.rb +65 -0
data/lib/rubino/interaction/state.rb +56 -0
data/lib/rubino/jobs/cron_job_repository.rb +75 -0
data/lib/rubino/jobs/handlers/cleanup_sessions_job.rb +32 -0
data/lib/rubino/jobs/handlers/compact_session_job.rb +21 -0
data/lib/rubino/jobs/handlers/distill_skill_job.rb +186 -0
data/lib/rubino/jobs/handlers/extract_memory_job.rb +37 -0
data/lib/rubino/jobs/handlers/summarize_session_job.rb +21 -0
data/lib/rubino/jobs/queue.rb +184 -0
data/lib/rubino/jobs/registry.rb +45 -0
data/lib/rubino/jobs/runner.rb +79 -0
data/lib/rubino/jobs/scheduler.rb +138 -0
data/lib/rubino/jobs/webhook_delivery.rb +225 -0
data/lib/rubino/jobs/worker.rb +59 -0
data/lib/rubino/llm/adapter_factory.rb +47 -0
data/lib/rubino/llm/adapter_response.rb +65 -0
data/lib/rubino/llm/auxiliary_client.rb +61 -0
data/lib/rubino/llm/bedrock_bearer_client.rb +235 -0
data/lib/rubino/llm/content_builder.rb +55 -0
data/lib/rubino/llm/credential_check.rb +93 -0
data/lib/rubino/llm/error_classifier.rb +364 -0
data/lib/rubino/llm/fake_provider.rb +292 -0
data/lib/rubino/llm/inline_think_filter.rb +58 -0
data/lib/rubino/llm/model_catalog.rb +29 -0
data/lib/rubino/llm/provider_resolver.rb +48 -0
data/lib/rubino/llm/reasoning_manager.rb +100 -0
data/lib/rubino/llm/request.rb +56 -0
data/lib/rubino/llm/ruby_llm_adapter.rb +794 -0
data/lib/rubino/llm/scenario_loader.rb +68 -0
data/lib/rubino/llm/scenario_selector.rb +80 -0
data/lib/rubino/llm/scenarios/agent-creates-cron-failure.yml +29 -0
data/lib/rubino/llm/scenarios/agent-creates-cron.yml +36 -0
data/lib/rubino/llm/scenarios/analysis.yml +501 -0
data/lib/rubino/llm/scenarios/complex-analysis.yml +598 -0
data/lib/rubino/llm/scenarios/failure.yml +65 -0
data/lib/rubino/llm/scenarios/happy-path.yml +24 -0
data/lib/rubino/llm/scenarios/provider-quota-completed.yml +14 -0
data/lib/rubino/llm/scenarios/wide-table.yml +121 -0
data/lib/rubino/llm/scenarios/with-approvals.yml +50 -0
data/lib/rubino/llm/scenarios/with-artifacts.yml +98 -0
data/lib/rubino/llm/scenarios/with-clarify.yml +32 -0
data/lib/rubino/llm/scenarios/with-reasoning.yml +175 -0
data/lib/rubino/llm/scenarios/with-uploads.yml +104 -0
data/lib/rubino/llm/thinking_support.rb +84 -0
data/lib/rubino/llm/tool_bridge.rb +89 -0
data/lib/rubino/logger.rb +99 -0
data/lib/rubino/mcp/manager.rb +180 -0
data/lib/rubino/mcp/mcp_tool_wrapper.rb +69 -0
data/lib/rubino/mcp.rb +57 -0
data/lib/rubino/memory/backend.rb +104 -0
data/lib/rubino/memory/backends/default.rb +101 -0
data/lib/rubino/memory/backends/sqlite.rb +653 -0
data/lib/rubino/memory/backends.rb +53 -0
data/lib/rubino/memory/deduplicator.rb +74 -0
data/lib/rubino/memory/extractor.rb +85 -0
data/lib/rubino/memory/flusher.rb +31 -0
data/lib/rubino/memory/retriever.rb +50 -0
data/lib/rubino/memory/sqlite_extraction_prompt.rb +70 -0
data/lib/rubino/memory/sqlite_graph.rb +154 -0
data/lib/rubino/memory/store.rb +228 -0
data/lib/rubino/memory/threat_scanner.rb +68 -0
data/lib/rubino/metrics.rb +175 -0
data/lib/rubino/modes.rb +93 -0
data/lib/rubino/oauth/connection_repository.rb +95 -0
data/lib/rubino/oauth/provider/github.rb +75 -0
data/lib/rubino/oauth/provider/google.rb +59 -0
data/lib/rubino/oauth/provider.rb +149 -0
data/lib/rubino/oauth/registry.rb +86 -0
data/lib/rubino/oauth/token_encryptor.rb +87 -0
data/lib/rubino/plugins/registry.rb +75 -0
data/lib/rubino/plugins.rb +86 -0
data/lib/rubino/run/approval_gate.rb +243 -0
data/lib/rubino/run/attachment_downloader.rb +166 -0
data/lib/rubino/run/event_store.rb +74 -0
data/lib/rubino/run/executor.rb +383 -0
data/lib/rubino/run/gate_registry.rb +39 -0
data/lib/rubino/run/recorder.rb +69 -0
data/lib/rubino/run/repository.rb +118 -0
data/lib/rubino/run/session_approval_cache.rb +118 -0
data/lib/rubino/security/allowlist_persister.rb +55 -0
data/lib/rubino/security/approval_policy.rb +227 -0
data/lib/rubino/security/command_allowlist.rb +24 -0
data/lib/rubino/security/dangerous_patterns.rb +118 -0
data/lib/rubino/security/deny_persister.rb +73 -0
data/lib/rubino/security/doom_loop_detector.rb +43 -0
data/lib/rubino/security/hardline_guard.rb +105 -0
data/lib/rubino/security/pattern_matcher.rb +62 -0
data/lib/rubino/security/prefix_deriver.rb +124 -0
data/lib/rubino/security/readonly_commands.rb +211 -0
data/lib/rubino/session/exporter.rb +101 -0
data/lib/rubino/session/message.rb +77 -0
data/lib/rubino/session/repository.rb +295 -0
data/lib/rubino/session/store.rb +198 -0
data/lib/rubino/session/summary_store.rb +65 -0
data/lib/rubino/skills/prompt_index.rb +85 -0
data/lib/rubino/skills/registry.rb +208 -0
data/lib/rubino/skills/skill.rb +176 -0
data/lib/rubino/skills/skill_tool.rb +215 -0
data/lib/rubino/skills/state_repository.rb +37 -0
data/lib/rubino/skills/toggle.rb +26 -0
data/lib/rubino/tools/answer_child_tool.rb +83 -0
data/lib/rubino/tools/ask_parent_tool.rb +232 -0
data/lib/rubino/tools/attach_file_tool.rb +120 -0
data/lib/rubino/tools/background_tasks.rb +520 -0
data/lib/rubino/tools/base.rb +222 -0
data/lib/rubino/tools/custom_tool_loader.rb +119 -0
data/lib/rubino/tools/edit_tool.rb +122 -0
data/lib/rubino/tools/git_tool.rb +71 -0
data/lib/rubino/tools/github_tool.rb +233 -0
data/lib/rubino/tools/glob_tool.rb +69 -0
data/lib/rubino/tools/grep_tool.rb +206 -0
data/lib/rubino/tools/memory_tool.rb +184 -0
data/lib/rubino/tools/multi_edit_tool.rb +110 -0
data/lib/rubino/tools/patch_tool.rb +260 -0
data/lib/rubino/tools/probe_tool.rb +175 -0
data/lib/rubino/tools/question_tool.rb +128 -0
data/lib/rubino/tools/read_attachment_tool.rb +180 -0
data/lib/rubino/tools/read_tool.rb +212 -0
data/lib/rubino/tools/read_tracker.rb +98 -0
data/lib/rubino/tools/registry.rb +166 -0
data/lib/rubino/tools/result.rb +113 -0
data/lib/rubino/tools/ruby_tool.rb +0 -0
data/lib/rubino/tools/session_search_tool.rb +103 -0
data/lib/rubino/tools/shell_input_tool.rb +96 -0
data/lib/rubino/tools/shell_kill_tool.rb +76 -0
data/lib/rubino/tools/shell_output_tool.rb +72 -0
data/lib/rubino/tools/shell_registry.rb +158 -0
data/lib/rubino/tools/shell_tail_tool.rb +118 -0
data/lib/rubino/tools/shell_tool.rb +330 -0
data/lib/rubino/tools/steer_tool.rb +118 -0
data/lib/rubino/tools/subagent_probe.rb +89 -0
data/lib/rubino/tools/summarize_file_tool.rb +182 -0
data/lib/rubino/tools/task_result_tool.rb +90 -0
data/lib/rubino/tools/task_stop_tool.rb +80 -0
data/lib/rubino/tools/task_tool.rb +622 -0
data/lib/rubino/tools/test_tool.rb +454 -0
data/lib/rubino/tools/todo_tool.rb +93 -0
data/lib/rubino/tools/tool_call_repository.rb +33 -0
data/lib/rubino/tools/vision_tool.rb +85 -0
data/lib/rubino/tools/webfetch_tool.rb +153 -0
data/lib/rubino/tools/websearch_tool.rb +179 -0
data/lib/rubino/tools/write_tool.rb +61 -0
data/lib/rubino/trust.rb +88 -0
data/lib/rubino/ui/api.rb +296 -0
data/lib/rubino/ui/base.rb +252 -0
data/lib/rubino/ui/bottom_composer.rb +1599 -0
data/lib/rubino/ui/cli.rb +1987 -0
data/lib/rubino/ui/completion_menu.rb +321 -0
data/lib/rubino/ui/completion_source.rb +284 -0
data/lib/rubino/ui/escape_reader.rb +169 -0
data/lib/rubino/ui/indented_io.rb +88 -0
data/lib/rubino/ui/input_history.rb +108 -0
data/lib/rubino/ui/live_region.rb +183 -0
data/lib/rubino/ui/markdown_renderer.rb +506 -0
data/lib/rubino/ui/notifier.rb +163 -0
data/lib/rubino/ui/null.rb +195 -0
data/lib/rubino/ui/paste_store.rb +176 -0
data/lib/rubino/ui/printer_base.rb +79 -0
data/lib/rubino/ui/probe_wait_indicator.rb +75 -0
data/lib/rubino/ui/queued_indicators.rb +66 -0
data/lib/rubino/ui/status_bar.rb +100 -0
data/lib/rubino/ui/stdout_proxy.rb +161 -0
data/lib/rubino/ui/streaming_markdown.rb +186 -0
data/lib/rubino/ui/subagent_cards.rb +134 -0
data/lib/rubino/ui/subagent_view.rb +255 -0
data/lib/rubino/ui.rb +21 -0
data/lib/rubino/update_check.rb +187 -0
data/lib/rubino/util/duration.rb +23 -0
data/lib/rubino/util/hyperlink.rb +105 -0
data/lib/rubino/util/output.rb +145 -0
data/lib/rubino/util/secrets_mask.rb +83 -0
data/lib/rubino/version.rb +5 -0
data/lib/rubino/workspace.rb +85 -0
data/lib/rubino-agent.rb +5 -0
data/lib/rubino.rb +318 -0
data/mise.toml +2 -0
data/rubino-agent.gemspec +103 -0
data/skills/ruby-expert/SKILL.md +67 -0
data/skills/ruby-expert/references/concurrency.md +357 -0
data/skills/ruby-expert/references/datetime-and-encoding.md +363 -0
data/skills/ruby-expert/references/errors-and-types.md +460 -0
data/skills/ruby-expert/references/gem-authoring.md +459 -0
data/skills/ruby-expert/references/language-idioms.md +465 -0
data/skills/ruby-expert/references/metaprogramming.md +339 -0
data/skills/ruby-expert/references/oo-design.md +553 -0
data/skills/ruby-expert/references/performance.md +383 -0
data/skills/ruby-expert/references/rails.md +424 -0
data/skills/ruby-expert/references/security.md +404 -0
data/skills/ruby-expert/references/testing.md +473 -0
data/skills/ruby-expert/references/tooling.md +466 -0
metadata +856 -0

data/lib/rubino/tools/test_tool.rb ADDED Viewed

@@ -0,0 +1,454 @@
+# frozen_string_literal: true
+module Rubino
+  module Tools
+    # Runs the workspace project's test suite and returns a STRUCTURED result
+    # instead of the raw toolchain firehose the `shell` tool emits.
+    #
+    # Why this exists (issue #101): to run tests the model used to drive `shell`
+    # and reason its way through the whole Ruby toolchain — bundler version
+    # mismatches, missing gems, which command to use. On real tasks that burned
+    # several tool calls and twice sent the agent chasing toolchain errors
+    # (bundler `GemNotFound`, an `undefined method 'untaint'` crash from an old
+    # pinned bundler) instead of the user's actual request; one earlier run even
+    # drifted toward `gem uninstall bundler` / `rm -rf …`. This tool:
+    #
+    #   - auto-detects the framework (rspec / minitest / rake) and the right
+    #     invocation, preferring `bundle exec` when a Gemfile is present and the
+    #     bundle is usable, falling back to the bare runner when it is not (so a
+    #     stale lockfile degrades gracefully rather than making the model fight
+    #     bundler),
+    #   - returns pass/fail counts, the failing examples (name + file:line +
+    #     short message) parsed from the runner output, and a short raw tail —
+    #     not the full backtrace,
+    #   - distinguishes "the suite could not even start" (toolchain error) from
+    #     "the suite ran and N failed", via the structured `error_code`.
+    #
+    # Execution mirrors ShellTool's foreground path: own process group, SIGTERM
+    # on timeout/cancel, cwd = workspace root (same resolution as ruby/shell).
+    class TestTool < Base
+      DEFAULT_TIMEOUT = 300
+      MAX_TIMEOUT     = 600
+      TICK            = 0.05
+      # Lines of raw runner output to keep for context. Enough to show the
+      # tail of a failure dump without dragging the full backtrace into context.
+      RAW_TAIL_LINES  = 40
+      # Returns the tool's name string.
+      def name
+        "run_tests"
+      end
+      # Returns the description text for this tool: what it runs, what the
+      # structured result contains, and the optional `path` / `framework`
+      # arguments.
+      def description
+        "Run the workspace project's test suite and return a structured result " \
+          "(framework, command, exit status, example/failure counts, and the " \
+          "failing examples with file:line and message). Auto-detects RSpec, " \
+          "Minitest, or a Rakefile default task; prefers `bundle exec` when a " \
+          "Gemfile is present and falls back to the bare runner if the bundle is " \
+          "broken. Optional `path` runs a single file or pattern; optional " \
+          "`framework` (rspec/minitest/rake) overrides detection. Use this " \
+          "instead of driving `shell` by hand to run tests."
+      end
+      def input_schema
+        {
+          type: "object",
+          properties: {
+            path: {
+              type: "string",
+              description: "Optional file or pattern to run a subset (e.g. " \
+                           "'spec/models/user_spec.rb' or 'spec/models/'). " \
+                           "Runs the whole suite when omitted."
+            },
+            framework: {
+              type: "string",
+              enum: %w[rspec minitest rake],
+              description: "Override framework detection. Omit to auto-detect."
+            },
+            timeout: {
+              type: "integer",
+              description: "Timeout in seconds (default #{DEFAULT_TIMEOUT}, max #{MAX_TIMEOUT})."
+            }
+          },
+          required: []
+        }
+      end
+      # Runs project code (the test suite), so gated like `ruby`: not
+      # destructive, but it does execute arbitrary code. :medium → asks in
+      # manual mode, auto-allowed in auto mode.
+      #
+      # Returns the Symbol :medium.
+      def risk_level
+        :medium
+      end
+      def call(arguments)
+        args      = arguments.is_a?(Hash) ? arguments : {}
+        path      = args["path"]      || args[:path]
+        override  = args["framework"] || args[:framework]
+        timeout   = (args["timeout"]  || args[:timeout] || DEFAULT_TIMEOUT).to_i
+        timeout   = [[timeout, 1].max, MAX_TIMEOUT].min
+        root = resolve_workspace
+        return { output: "Error: cannot access workspace directory", error_code: :workspace_error } unless root
+        framework = (override && !override.to_s.empty? ? override.to_s : detect_framework(root))
+        unless framework
+          return { output: "Error: no test setup detected in #{root} — looked for " \
+                           "spec/ (.rspec), test/, and a Rakefile. Pass `framework` " \
+                           "to override, or use the shell tool for a custom command.",
+                   error_code: :no_test_setup }
+        end
+        command = build_command(root, framework, path)
+        run     = execute(command, root, timeout)
+        build_result(framework, command, run)
+      end
+      private
+      # Same cwd resolution as ruby_tool/shell_tool: terminal.cwd or Dir.pwd,
+      # fully resolved through symlinks. nil if it can't be reached.
+      def resolve_workspace
+        candidate = Rubino::Workspace.primary_root
+        path = File.realpath(File.expand_path(candidate))
+        File.directory?(path) ? path : nil
+      rescue Errno::ENOENT, Errno::EACCES, Errno::ELOOP
+        nil
+      end
+      # Detection order mirrors the issue: RSpec first (most common in gems),
+      # then Minitest, then a bare Rakefile default task.
+      def detect_framework(root)
+        return "rspec"    if rspec?(root)
+        return "minitest" if minitest?(root)
+        return "rake"     if File.exist?(File.join(root, "Rakefile"))
+        nil
+      end
+      def rspec?(root)
+        File.exist?(File.join(root, ".rspec")) ||
+          File.directory?(File.join(root, "spec"))
+      end
+      def minitest?(root)
+        return false unless File.directory?(File.join(root, "test"))
+        # A `test/` dir alone is the signal; rake/rails drive it. We don't try
+        # to grep for `require "minitest"` — too fragile across layouts.
+        true
+      end
+      def gemfile?(root)
+        File.exist?(File.join(root, "Gemfile"))
+      end
+      # Prefer `bundle exec` when a Gemfile is present AND the bundle resolves;
+      # otherwise fall back to the bare runner. The fallback is the whole point
+      # of #101: a stale/pinned lockfile must not make the model fight bundler.
+      def build_command(root, framework, path)
+        bundle = gemfile?(root) && bundle_usable?(root)
+        prefix = bundle ? "bundle exec " : ""
+        case framework
+        when "rspec"
+          target = path && !path.to_s.empty? ? " #{shellescape(path)}" : ""
+          "#{prefix}rspec#{target}"
+        when "minitest"
+          build_minitest_command(root, prefix, path)
+        when "rake"
+          "#{prefix}rake"
+        end
+      end
+      # `rake test` is the canonical entry for a Minitest project (it sets up
+      # $LOAD_PATH and picks up test/**). When the model wants a single file we
+      # can't go through rake's task, so run it with ruby -Itest -Ilib directly.
+      def build_minitest_command(root, prefix, path)
+        if path && !path.to_s.empty?
+          "#{prefix}ruby -Itest -Ilib #{shellescape(path)}"
+        elsif rails?(root)
+          "#{prefix}bin/rails test"
+        else
+          "#{prefix}rake test"
+        end
+      end
+      def rails?(root)
+        File.exist?(File.join(root, "bin", "rails"))
+      end
+      # Cheap, non-mutating bundle check: `bundle check` exits 0 only when the
+      # gems in the lockfile are installed and satisfiable. Catches the #101
+      # cases (version-mismatched / pinned-bundler lockfiles) before we commit
+      # to `bundle exec`, so we degrade to the bare runner instead of letting
+      # the model watch a bundler backtrace scroll by. Capped tight so a slow
+      # `bundle check` never dominates the call.
+      def bundle_usable?(root)
+        _, status = Open3.capture2e(
+          { "BUNDLE_GEMFILE" => File.join(root, "Gemfile") },
+          "bundle", "check",
+          chdir: root
+        )
+        status&.success?
+      rescue StandardError
+        # bundler not installed, or it crashed (the untaint-style failure):
+        # treat the bundle as unusable and fall back to the bare runner.
+        false
+      end
+      def shellescape(str)
+        require "shellwords"
+        Shellwords.escape(str.to_s)
+      end
+      # Foreground exec in its own process group, SIGTERM on timeout/cancel.
+      # Merged stdout+stderr — the runners interleave results and warnings, and
+      # we parse the combined stream anyway.
+      #
+      # command - shell command String to spawn.
+      # cwd     - directory the child is started in.
+      # timeout - seconds to wait before the process group is terminated.
+      #
+      # Returns a Hash with :output, :exit_code (nil when cancelled, timed out
+      # or never started), :cancelled, :timed_out and :duration_ms; a launch
+      # failure additionally sets :started_error.
+      def execute(command, cwd, timeout)
+        require "open3"
+        rd, wr = IO.pipe
+        pid    = Process.spawn(command, chdir: cwd, pgroup: true, out: wr, err: wr)
+        pgid   = pid
+        # Close our copy of the write end so the reader sees EOF once the
+        # child (and anything it spawned) exits.
+        wr.close
+        buf = +""
+        reader = Thread.new do
+          rd.each_line do |line|
+            buf << line
+            emit_chunk(line)
+          end
+        rescue IOError, Errno::EBADF
+          # pipe closed — process exited
+        ensure
+          rd.close unless rd.closed?
+        end
+        started  = Process.clock_gettime(Process::CLOCK_MONOTONIC)
+        # Same monotonic clock as the duration, so a wall-clock adjustment
+        # can neither shorten nor extend the timeout.
+        deadline = started + timeout
+        status   = nil
+        loop do
+          wpid, status = Process.waitpid2(pid, Process::WNOHANG)
+          break if wpid
+          if cancellation_requested?
+            terminate_group(pgid)
+            reader.join(0.5)
+            # Escalate to SIGKILL for anything that ignored SIGTERM.
+            begin
+              Process.kill("KILL", -pgid)
+            rescue StandardError
+              nil
+            end
+            begin
+              Process.waitpid2(pid)
+            rescue StandardError
+              nil
+            end
+            return { output: buf.dup, exit_code: nil, cancelled: true, timed_out: false,
+                     duration_ms: elapsed_ms(started) }
+          end
+          if Process.clock_gettime(Process::CLOCK_MONOTONIC) >= deadline
+            terminate_group(pgid)
+            _, status = Process.waitpid2(pid, Process::WNOHANG)
+            unless status
+              # Give the group a moment to exit on SIGTERM, then force it.
+              reader.join(2)
+              begin
+                Process.kill("KILL", -pgid)
+              rescue StandardError
+                nil
+              end
+              _, status = Process.waitpid2(pid)
+            end
+            reader.join(0.5)
+            return { output: buf.dup, exit_code: nil, cancelled: false, timed_out: true,
+                     duration_ms: elapsed_ms(started) }
+          end
+          sleep TICK
+        end
+        reader.join
+        { output: buf, exit_code: status&.exitstatus, cancelled: false, timed_out: false,
+          duration_ms: elapsed_ms(started) }
+      rescue StandardError => e
+        { output: "Error launching tests: #{e.message}", exit_code: nil, cancelled: false,
+          timed_out: false, started_error: true, duration_ms: 0 }
+      ensure
+        # If Process.spawn raised, the write end was never closed above;
+        # release both ends here so a failed launch does not leak descriptors.
+        wr.close if wr && !wr.closed?
+        rd.close if rd && !rd.closed?
+      end
+      def terminate_group(pgid)
+        Process.kill("TERM", -pgid)
+      rescue Errno::ESRCH, Errno::EPERM
+        # already gone / not ours
+      end
+      def elapsed_ms(started)
+        ((Process.clock_gettime(Process::CLOCK_MONOTONIC) - started) * 1000).round
+      end
+      # Turns the run hash into the model-facing structured Result. Parses the
+      # combined output into counts + failing examples, classifies the outcome,
+      # and keeps a short raw tail for context.
+      def build_result(framework, command, run)
+        raw     = run[:output].to_s
+        parsed  = parse_output(framework, raw)
+        ran     = parsed[:ran]
+        tail    = tail_lines(raw)
+        outcome, error_code = classify(run, parsed)
+        summary = build_summary(framework, command, run, parsed, outcome)
+        body    = [summary, "", "--- raw output (tail) ---", tail].join("\n")
+        {
+          output: body,
+          body: summary,
+          body_kind: :plain,
+          metrics: "#{outcome} · #{format_ms(run[:duration_ms])}",
+          error_code: error_code,
+          # Structured fields, so the executor / future contract tests can
+          # branch without re-parsing the text.
+          framework: framework,
+          command: command,
+          exit_code: run[:exit_code],
+          ran: ran,
+          examples: parsed[:examples],
+          failures: parsed[:failures],
+          failing: parsed[:failing]
+        }
+      end
+      # outcome label + error_code symbol. The critical distinction (#101):
+      # the suite NOT starting (toolchain error) vs. running with failures.
+      def classify(run, parsed)
+        return ["cancelled", :cancelled]      if run[:cancelled]
+        return ["timeout", :timeout]          if run[:timed_out]
+        return ["could not start", :test_runner_error] if run[:started_error] || !parsed[:ran]
+        return ["#{parsed[:failures]} failed", :tests_failed] if parsed[:failures].to_i.positive?
+        return ["nonzero exit", :exit_nonzero] if run[:exit_code] && run[:exit_code] != 0
+        ["passed", nil]
+      end
+      # Renders the plain-text summary: framework, command, exit status and
+      # outcome, followed by either the counts and failing examples (when the
+      # suite ran) or a note that it did not run.
+      def build_summary(framework, command, run, parsed, outcome)
+        exit_label = run[:exit_code].nil? ? "(none)" : run[:exit_code]
+        lines = [
+          "framework: #{framework}",
+          "command:   #{command}",
+          "exit:      #{exit_label}",
+          "outcome:   #{outcome}"
+        ]
+        unless parsed[:ran]
+          lines << "note:      the suite did not run (toolchain/setup error) — " \
+                   "see the raw tail below"
+          return lines.join("\n")
+        end
+
+        example_count = parsed[:examples].nil? ? "?" : parsed[:examples]
+        failure_count = parsed[:failures].nil? ? "?" : parsed[:failures]
+        lines << "examples:  #{example_count}"
+        lines << "failures:  #{failure_count}"
+        unless parsed[:failing].empty?
+          lines << "failing:"
+          entries = parsed[:failing].map do |failure|
+            location = failure[:location] ? " (#{failure[:location]})" : ""
+            message  = failure[:message].to_s
+            detail   = message.empty? ? "" : " — #{message}"
+            "  - #{failure[:description]}#{location}#{detail}"
+          end
+          lines.concat(entries)
+        end
+        lines.join("\n")
+      end
+      def tail_lines(raw)
+        lines = raw.lines.map(&:chomp)
+        return raw.chomp if lines.size <= RAW_TAIL_LINES
+        ["… [#{lines.size - RAW_TAIL_LINES} earlier lines omitted] …"]
+          .concat(lines.last(RAW_TAIL_LINES)).join("\n")
+      end
+      def parse_output(framework, raw)
+        case framework
+        when "rspec"          then parse_rspec(raw)
+        when "minitest"       then parse_minitest(raw)
+        else                       parse_generic(raw)
+        end
+      end
+      # RSpec: "N examples, M failures[, K pending]" summary line, and the
+      # "Failures:" block with "rspec ./path:line # description".
+      def parse_rspec(raw)
+        summary = raw.match(/(\d+)\s+examples?,\s+(\d+)\s+failures?/)
+        return parse_generic(raw) unless summary
+        examples = summary[1].to_i
+        failures = summary[2].to_i
+        failing = []
+        # The rerun lines RSpec prints at the bottom give location +
+        # description; the numbered Failures: block gives the message.
+        messages = rspec_failure_messages(raw)
+        raw.scan(%r{^rspec\s+(\.?/?\S+:\d+)\s+#\s+(.+)$}).each_with_index do |(loc, desc), i|
+          failing << { description: desc.strip, location: loc.strip, message: messages[i] }
+        end
+        { ran: true, examples: examples, failures: failures, failing: failing }
+      end
+      # Pulls the first line of each numbered failure block in RSpec's
+      # "Failures:" section: "  1) Some description\n     Failure/Error: ...\n
+      # <message>". We grab the message line(s) after Failure/Error.
+      def rspec_failure_messages(raw)
+        section = raw[/^Failures:\n(.*?)(?:\n\nFinished|\n\n\d+ examples?)/m, 1]
+        return [] unless section
+        section.split(/^\s*\d+\)\s/).reject(&:empty?).map do |block|
+          msg = block[%r{Failure/Error:.*?\n\s*\n?\s*(.+)}m, 1] ||
+                block[%r{Failure/Error:\s*(.+)}, 1]
+          msg.to_s.lines.first.to_s.strip
+        end
+      end
+      # Minitest: "N runs, M assertions, F failures, E errors, S skips".
+      # Failures print as numbered blocks headed by
+      # "TestClass#test_name [file:line]:"; errors are headed by
+      # "TestClass#test_name:" with no bracketed location, followed by
+      # "ExceptionClass: message" and the backtrace.
+      #
+      # Returns { ran: true, examples:, failures:, failing: } where :failures
+      # is failures + errors. Falls back to #parse_generic when the summary
+      # line is missing. Entries for errors carry a nil :location.
+      def parse_minitest(raw)
+        summary = raw.match(/(\d+)\s+runs?,\s+(\d+)\s+assertions?,\s+(\d+)\s+failures?,\s+(\d+)\s+errors?/)
+        return parse_generic(raw) unless summary
+        runs     = summary[1].to_i
+        failures = summary[3].to_i + summary[4].to_i # failures + errors
+        # The bracketed location is optional so that Error blocks, which the
+        # :failures count already includes, are listed too instead of being
+        # silently left out of :failing.
+        labelled = /^\s*\d+\)\s+(?:Failure|Error):\n\s*(\S+?)(?:\s*\[([^\]]+)\])?:\n(.+)/
+        failing = raw.scan(labelled).map do |name, loc, msg|
+          { description: name.strip, location: loc&.strip, message: msg.to_s.lines.first.to_s.strip }
+        end
+        # Some minitest reporters omit the "Failure:/Error:" label line.
+        if failing.empty?
+          unlabelled = /^\s*\d+\)\s+(\S+#\S+)\s*\[([^\]]+)\]:\n(.+)/
+          failing = raw.scan(unlabelled).map do |name, loc, msg|
+            { description: name.strip, location: loc.strip, message: msg.to_s.lines.first.to_s.strip }
+          end
+        end
+        { ran: true, examples: runs, failures: failures, failing: failing }
+      end
+      # No recognizable summary line: we can't trust counts. Treat as "ran" only
+      # if there's a hint the runner produced test output; otherwise leave ran
+      # to the exit-code classifier (started_error / nonzero) upstream.
+      def parse_generic(raw)
+        ran = raw.match?(/\d+\s+(examples?|runs?|tests?)/) ||
+              raw.match?(/Finished in/)
+        { ran: ran, examples: nil, failures: nil, failing: [] }
+      end
+      def format_ms(ms)
+        if ms < 1000      then "#{ms}ms"
+        elsif ms < 60_000 then "#{(ms / 1000.0).round(1)}s"
+        else
+          mins, rem = ms.divmod(60_000)
+          "#{mins}m#{(rem / 1000.0).round}s"
+        end
+      end
+    end
+  end
+end

data/lib/rubino/tools/todo_tool.rb ADDED Viewed

@@ -0,0 +1,93 @@
+# frozen_string_literal: true
+module Rubino
+  module Tools
+    # Tool for managing a task/todo list during a session.
+    # Allows the agent to track progress on complex multi-step tasks.
+    class TodoTool < Base
+      def name
+        "todowrite"
+      end
+      def description
+        "Create and manage a structured task list for the current session. " \
+          "Use this to track progress on complex multi-step tasks. " \
+          "Tasks have content, status (pending/in_progress/completed/cancelled), and priority."
+      end
+      def input_schema
+        {
+          type: "object",
+          properties: {
+            todos: {
+              type: "array",
+              items: {
+                type: "object",
+                properties: {
+                  content: { type: "string", description: "Brief description of the task" },
+                  status: {
+                    type: "string",
+                    enum: %w[pending in_progress completed cancelled],
+                    description: "Current task status"
+                  },
+                  priority: {
+                    type: "string",
+                    enum: %w[high medium low],
+                    description: "Task priority level"
+                  }
+                },
+                required: %w[content status priority]
+              },
+              description: "The complete updated todo list"
+            }
+          },
+          required: %w[todos]
+        }
+      end
+      def risk_level
+        :low
+      end
+      def call(arguments)
+        todos = arguments["todos"] || arguments[:todos]
+        return "Error: No todos provided" unless todos.is_a?(Array)
+        format_todo_summary(todos)
+      end
+      private
+      def format_todo_summary(todos)
+        completed = todos.count { |t| t["status"] == "completed" || t[:status] == "completed" }
+        in_progress = todos.count { |t| t["status"] == "in_progress" || t[:status] == "in_progress" }
+        pending = todos.count { |t| t["status"] == "pending" || t[:status] == "pending" }
+        cancelled = todos.count { |t| t["status"] == "cancelled" || t[:status] == "cancelled" }
+        lines = ["Todo list updated (#{todos.size} items):"]
+        lines << "  Completed: #{completed}" if completed > 0
+        lines << "  In Progress: #{in_progress}" if in_progress > 0
+        lines << "  Pending: #{pending}" if pending > 0
+        lines << "  Cancelled: #{cancelled}" if cancelled > 0
+        lines << ""
+        todos.each do |todo|
+          content = todo["content"] || todo[:content]
+          status = todo["status"] || todo[:status]
+          priority = todo["priority"] || todo[:priority]
+          icon = case status
+                 when "completed" then "[x]"
+                 when "in_progress" then "[>]"
+                 when "cancelled" then "[-]"
+                 else "[ ]"
+                 end
+          lines << "  #{icon} #{content} (#{priority})"
+        end
+        lines.join("\n")
+      end
+    end
+  end
+end

data/lib/rubino/tools/tool_call_repository.rb ADDED Viewed

@@ -0,0 +1,33 @@
+# frozen_string_literal: true
+require "securerandom"
+require "json"
+module Rubino
+  module Tools
+    # Persists tool call audit records to the database.
+    # Extracted from Agent::ToolExecutor to respect the separation between
+    # domain execution logic and storage concerns.
+    class ToolCallRepository
+      # Inserts one row into the tool_calls table.
+      #
+      # `result` must respond to #session_id and #output. A missing call_id is
+      # replaced with a random UUID. started_at and finished_at receive the
+      # same value, the UTC time of recording in ISO 8601 form. Returns
+      # whatever the insert returns, or nil when anything raises: failures are
+      # swallowed so that a database outage never causes a tool call to fail.
+      def record(name:, call_id:, arguments:, result:, status:, error: nil)
+        # Formatted with core Time#strftime rather than Time#iso8601. Before
+        # Ruby 3.4 the latter exists only once the "time" stdlib has been
+        # required, which this file does not do; the resulting NoMethodError
+        # would be swallowed by the rescue below and every audit row silently
+        # dropped. The output is the same text Time#iso8601 gives for UTC.
+        now = Time.now.utc.strftime("%Y-%m-%dT%H:%M:%SZ")
+        Rubino.database.db[:tool_calls].insert(
+          id: call_id || SecureRandom.uuid,
+          session_id: result.session_id,
+          tool_name: name,
+          input_json: JSON.generate(arguments),
+          output: result.output,
+          status: status,
+          started_at: now,
+          finished_at: now,
+          error: error
+        )
+      rescue StandardError
+        # Don't fail the tool call just because audit persistence failed.
+        nil
+      end
+    end
+  end
+end

data/lib/rubino/tools/vision_tool.rb ADDED Viewed

@@ -0,0 +1,85 @@
+# frozen_string_literal: true
+require_relative "../llm/auxiliary_client"
+module Rubino
+  module Tools
+    # Delegates image-understanding to a multimodal aux model so a text-only
+    # primary can still "see" what the user uploaded. Implements the
+    # agent-as-tool semantics from the OpenAI Agents SDK: the primary stays
+    # in control, calls this tool with a focused question, and receives a
+    # structured (text) reply — no conversation handoff, no shared history.
+    #
+    # The aux model is resolved from `auxiliary.vision` in config. When the
+    # primary already supports vision (per Configuration#model_supports_vision?)
+    # AND no aux is configured, Registry hides this tool — there's no useful
+    # delegation to perform.
+    class VisionTool < Base
+      def name
+        "vision"
+      end
+      def description
+        "Ask a multimodal model to describe or interpret an image. " \
+          "Use when you need to understand visual content (charts, screenshots, " \
+          "diagrams, photos). Provide an optional focused question to direct the " \
+          "analysis; default is a full markdown description."
+      end
+      def input_schema
+        {
+          type: "object",
+          properties: {
+            file_path: {
+              type: "string",
+              description: "Absolute path to an image file (.png .jpg .jpeg .webp .gif .bmp)"
+            },
+            question: {
+              type: "string",
+              description: "Optional focused question. Default: 'Describe what you see in markdown.'"
+            }
+          },
+          required: %w[file_path]
+        }
+      end
+      def risk_level
+        :low
+      end
+      def call(arguments)
+        path     = (arguments["file_path"] || arguments[:file_path]).to_s
+        question = (arguments["question"]  || arguments[:question] ||
+                    "Describe what you see in markdown.").to_s
+        return "Error: file_path is required" if path.empty?
+        expanded = File.expand_path(path)
+        return "Error: file not found: #{path}" unless File.exist?(expanded)
+        return "Error: not a regular file: #{path}" unless File.file?(expanded)
+        ext = File.extname(expanded).downcase
+        unless LLM::ContentBuilder::SUPPORTED_IMAGE_TYPES.include?(ext)
+          return "Error: unsupported image extension '#{ext}'. " \
+                 "Supported: #{LLM::ContentBuilder::SUPPORTED_IMAGE_TYPES.join(", ")}"
+        end
+        # Pass the image through ruby_llm's native `with:` slot (image_paths),
+        # NOT as an OpenAI-style content array. ruby_llm's `ask` stringifies an
+        # array content, so the base64 bytes would reach the model as TEXT and
+        # it hallucinates (prod sessions 38/41: M3 saw the image perfectly when
+        # called directly, but got a text blob through this path). image_paths
+        # attaches the file as a real multimodal part — same route the primary
+        # uses for native vision.
+        response = LLM::AuxiliaryClient.new.call(
+          task: :vision,
+          messages: [{ role: "user", content: question }],
+          image_paths: [expanded]
+        )
+        response.content.to_s
+      rescue StandardError => e
+        "Error calling vision model: #{e.class}: #{e.message}"
+      end
+    end
+  end
+end