RubyGems - anima-core - Versions diffs - 1.4.0 → 1.5.0 - Mend

anima-core 1.4.0 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (149)

checksums.yaml +4 -4
data/.reek.yml +18 -20
data/README.md +61 -95
data/agents/thoughts-analyzer.md +12 -7
data/anima-core.gemspec +1 -0
data/app/channels/session_channel.rb +38 -58
data/app/decorators/agent_message_decorator.rb +7 -2
data/app/decorators/message_decorator.rb +31 -100
data/app/decorators/pending_from_melete_decorator.rb +36 -0
data/app/decorators/pending_from_melete_goal_decorator.rb +13 -0
data/app/decorators/pending_from_melete_skill_decorator.rb +19 -0
data/app/decorators/pending_from_melete_workflow_decorator.rb +13 -0
data/app/decorators/pending_from_mneme_decorator.rb +44 -0
data/app/decorators/pending_message_decorator.rb +94 -0
data/app/decorators/pending_subagent_decorator.rb +46 -0
data/app/decorators/pending_tool_response_decorator.rb +51 -0
data/app/decorators/pending_user_message_decorator.rb +22 -0
data/app/decorators/system_message_decorator.rb +5 -0
data/app/decorators/tool_call_decorator.rb +13 -2
data/app/decorators/tool_response_decorator.rb +2 -2
data/app/decorators/user_message_decorator.rb +7 -2
data/app/jobs/count_tokens_job.rb +23 -0
data/app/jobs/drain_job.rb +169 -0
data/app/jobs/melete_enrichment_job/goal_change_listener.rb +52 -0
data/app/jobs/melete_enrichment_job.rb +48 -0
data/app/jobs/mneme_enrichment_job.rb +46 -0
data/app/jobs/tool_execution_job.rb +87 -0
data/app/models/concerns/token_estimation.rb +54 -0
data/app/models/goal.rb +21 -10
data/app/models/message.rb +47 -36
data/app/models/pending_message.rb +276 -29
data/app/models/pinned_message.rb +8 -3
data/app/models/session.rb +468 -432
data/app/models/snapshot.rb +11 -21
data/bin/inspect-cassette +17 -4
data/config/application.rb +1 -0
data/config/initializers/event_subscribers.rb +71 -4
data/config/initializers/inflections.rb +3 -1
data/db/cable_structure.sql +3 -3
data/db/migrate/20260407170803_remove_viewport_message_ids_from_sessions.rb +5 -0
data/db/migrate/20260407180400_remove_mneme_snapshot_pointer_columns_from_sessions.rb +6 -0
data/db/migrate/20260411120553_add_token_count_to_pinned_messages.rb +5 -0
data/db/migrate/20260411172926_remove_active_skills_and_workflow_from_sessions.rb +6 -0
data/db/migrate/20260412110625_replace_processing_with_aasm_state.rb +6 -0
data/db/migrate/20260418150323_add_kind_and_message_type_to_pending_messages.rb +6 -0
data/db/migrate/20260419120000_add_drain_fields_to_pending_messages.rb +7 -0
data/db/migrate/20260419130000_drop_pending_messages_kind_default.rb +5 -0
data/db/migrate/20260419140000_add_drain_indexes_to_pending_messages.rb +8 -0
data/db/migrate/20260420100000_add_hud_visibility_to_sessions.rb +15 -0
data/db/queue_structure.sql +13 -13
data/db/structure.sql +44 -31
data/lib/agents/registry.rb +1 -1
data/lib/anima/settings.rb +7 -33
data/lib/anima/version.rb +1 -1
data/lib/events/authentication_required.rb +24 -0
data/lib/events/bounce_back.rb +4 -4
data/lib/events/eviction_completed.rb +28 -0
data/lib/events/goal_created.rb +28 -0
data/lib/events/goal_updated.rb +32 -0
data/lib/events/llm_responded.rb +35 -0
data/lib/events/message_created.rb +27 -0
data/lib/events/message_updated.rb +25 -0
data/lib/events/session_state_changed.rb +30 -0
data/lib/events/skill_activated.rb +28 -0
data/lib/events/start_melete.rb +36 -0
data/lib/events/start_mneme.rb +33 -0
data/lib/events/start_processing.rb +32 -0
data/lib/events/subagent_evicted.rb +31 -0
data/lib/events/subscribers/active_state_broadcaster.rb +27 -0
data/lib/events/subscribers/authentication_broadcaster.rb +34 -0
data/lib/events/subscribers/drain_kickoff.rb +20 -0
data/lib/events/subscribers/eviction_broadcaster.rb +26 -0
data/lib/events/subscribers/llm_response_handler.rb +111 -0
data/lib/events/subscribers/melete_kickoff.rb +24 -0
data/lib/events/subscribers/message_broadcaster.rb +34 -0
data/lib/events/subscribers/mneme_kickoff.rb +24 -0
data/lib/events/subscribers/mneme_scheduler.rb +21 -0
data/lib/events/subscribers/persister.rb +6 -8
data/lib/events/subscribers/session_state_broadcaster.rb +33 -0
data/lib/events/subscribers/subagent_message_router.rb +26 -29
data/lib/events/subscribers/subagent_visibility_broadcaster.rb +33 -0
data/lib/events/subscribers/tool_response_creator.rb +33 -0
data/lib/events/subscribers/transient_broadcaster.rb +1 -1
data/lib/events/tool_executed.rb +34 -0
data/lib/events/workflow_activated.rb +27 -0
data/lib/llm/client.rb +41 -201
data/lib/mcp/client_manager.rb +41 -46
data/lib/mcp/stdio_transport.rb +9 -5
data/lib/{analytical_brain → melete}/runner.rb +63 -68
data/lib/{analytical_brain → melete}/tools/activate_skill.rb +1 -1
data/lib/{analytical_brain → melete}/tools/assign_nickname.rb +2 -2
data/lib/{analytical_brain → melete}/tools/everything_is_ready.rb +2 -2
data/lib/{analytical_brain → melete}/tools/finish_goal.rb +3 -3
data/lib/{analytical_brain → melete}/tools/goal_messaging.rb +4 -3
data/lib/{analytical_brain → melete}/tools/read_workflow.rb +2 -2
data/lib/{analytical_brain → melete}/tools/rename_session.rb +3 -3
data/lib/{analytical_brain → melete}/tools/set_goal.rb +1 -1
data/lib/{analytical_brain → melete}/tools/update_goal.rb +4 -4
data/lib/{analytical_brain.rb → melete.rb} +6 -3
data/lib/mneme/base_runner.rb +121 -0
data/lib/mneme/l2_runner.rb +14 -20
data/lib/mneme/recall_runner.rb +132 -0
data/lib/mneme/runner.rb +118 -171
data/lib/mneme/search.rb +104 -62
data/lib/mneme/tools/nothing_to_surface.rb +25 -0
data/lib/mneme/tools/save_snapshot.rb +2 -10
data/lib/mneme/tools/surface_memory.rb +89 -0
data/lib/mneme.rb +11 -5
data/lib/shell_session.rb +287 -612
data/lib/skills/definition.rb +2 -2
data/lib/skills/registry.rb +1 -1
data/lib/tools/base.rb +16 -0
data/lib/tools/bash.rb +25 -57
data/lib/tools/edit.rb +2 -0
data/lib/tools/read.rb +2 -0
data/lib/tools/registry.rb +79 -3
data/lib/tools/{recall.rb → search_messages.rb} +19 -21
data/lib/tools/spawn_specialist.rb +16 -10
data/lib/tools/spawn_subagent.rb +20 -14
data/lib/tools/subagent_prompts.rb +4 -4
data/lib/tools/think.rb +1 -1
data/lib/tools/{remember.rb → view_messages.rb} +10 -10
data/lib/tools/write.rb +2 -0
data/lib/tui/app.rb +5 -4
data/lib/tui/braille_spinner.rb +7 -7
data/lib/tui/decorators/base_decorator.rb +24 -3
data/lib/tui/message_store.rb +93 -44
data/lib/tui/screens/chat.rb +94 -20
data/lib/tui/settings.rb +9 -2
data/lib/workflows/definition.rb +3 -3
data/lib/workflows/registry.rb +1 -1
data/skills/github.md +38 -0
data/templates/config.toml +4 -23
data/workflows/review_pr.md +18 -14
metadata +86 -28
data/app/jobs/agent_request_job.rb +0 -199
data/app/jobs/analytical_brain_job.rb +0 -33
data/app/jobs/count_message_tokens_job.rb +0 -39
data/app/jobs/passive_recall_job.rb +0 -24
data/app/models/concerns/message/broadcasting.rb +0 -86
data/lib/agent_loop.rb +0 -215
data/lib/analytical_brain/tools/deactivate_skill.rb +0 -40
data/lib/analytical_brain/tools/deactivate_workflow.rb +0 -35
data/lib/events/agent_message.rb +0 -25
data/lib/events/subscribers/message_collector.rb +0 -64
data/lib/events/tool_call.rb +0 -31
data/lib/events/tool_response.rb +0 -33
data/lib/mneme/compressed_viewport.rb +0 -204
data/lib/mneme/passive_recall.rb +0 -138

data/lib/llm/client.rb CHANGED Viewed

@@ -1,15 +1,26 @@
 # frozen_string_literal: true
 module LLM
-  # Convenience layer over {Providers::Anthropic} for sending messages
-  # and handling tool execution loops.
+  # Convenience layer over {Providers::Anthropic} for phantom sessions
+  # (Mneme, Melete, Mneme::L2Runner) that need a multi-round tool-use
+  # loop driven from plain Ruby objects rather than the main drain
+  # pipeline.
+  #
+  # The main agent loop does NOT use this class — {DrainJob} talks to
+  # the provider directly and emits {Events::LLMResponded} for
+  # {Events::Subscribers::LLMResponseHandler} to process. The tool loop
+  # here is deliberately minimal: no events, no AASM transitions, no
+  # interrupt handling — phantom sessions don't interact with those
+  # machineries.
   #
   # @example
   #   registry = Tools::Registry.new
-  #   registry.register(Tools::WebGet)
-  #   client.chat_with_tools(messages, registry: registry, session_id: session.id)
+  #   registry.register(Tools::SaveSnapshot)
+  #   client.chat_with_tools(messages, registry: registry)
   class Client
-    # Synthetic tool_result when a tool is skipped because the human pressed Escape.
+    # Synthetic tool_result text shown when a tool run is aborted by the
+    # user's Escape press. Mirrored into the interrupt subsystem so both
+    # the bash tool and any future interrupt handler share the phrasing.
     INTERRUPT_MESSAGE = "Your human wants your attention"
     # @return [Providers::Anthropic] the underlying API provider
@@ -33,31 +44,20 @@ module LLM
       @logger = logger
     end
-    # Send messages with tool support. Runs the full tool execution loop:
-    # call LLM, execute any requested tools, feed results back, repeat
-    # until the LLM produces a final text response.
-    #
-    # Emits {Events::ToolCall} and {Events::ToolResponse} events for each
-    # tool interaction so they're persisted and visible in the event stream.
+    # Runs a minimal multi-round tool-use cycle: call the LLM, execute
+    # any requested tools, feed results back, repeat until the LLM
+    # produces a final text response.
     #
-    # When the user interrupts via Escape, remaining tools receive synthetic
-    # "Your human wants your attention" results and the loop exits without another LLM call.
+    # Intended for phantom sessions (Mneme, Melete). No events are
+    # emitted and no persistence happens — the caller is responsible
+    # for capturing whatever state the tool runs produce.
     #
     # @param messages [Array<Hash>] conversation messages in Anthropic format
     # @param registry [Tools::Registry] registered tools to make available
-    # @param session_id [Integer, String] session ID for emitted events
-    # @param first_response [Hash, nil] pre-fetched first API response from
-    #   {AgentLoop#deliver!}. Skips the first API call when provided so
-    #   the Bounce Back transaction doesn't duplicate work.
-    # @param between_rounds [#call, nil] callback invoked after each tool
-    #   round completes, before the next LLM request. Must return an
-    #   +Array<String>+ of message contents to inject (e.g. promoted
-    #   pending messages). Injected as +text+ blocks alongside
-    #   +tool_result+ blocks so the LLM sees them in the next round.
     # @param options [Hash] additional API parameters (e.g. +system:+)
-    # @return [Hash, nil] +:text+ (String) and +:api_metrics+ (Hash), or nil when interrupted
+    # @return [Hash] +:text+ (String) and +:api_metrics+ (Hash)
     # @raise [Providers::Anthropic::Error] on API errors
-    def chat_with_tools(messages, registry:, session_id:, first_response: nil, between_rounds: nil, **options)
+    def chat_with_tools(messages, registry:, **options)
       messages = messages.dup
       rounds = 0
       last_api_metrics = nil
@@ -69,49 +69,26 @@ module LLM
           return {text: "[Tool loop exceeded #{max_rounds} rounds — halting]", api_metrics: last_api_metrics}
         end
-        response = if first_response && rounds == 1
-          first_response
-        else
-          broadcast_session_state(session_id, "llm_generating")
-          provider.create_message(
-            model: model,
-            messages: messages,
-            max_tokens: max_tokens,
-            tools: registry.schemas,
-            include_metrics: true,
-            **options
-          )
-        end
+        response = provider.create_message(
+          model: model,
+          messages: messages,
+          max_tokens: max_tokens,
+          tools: registry.schemas,
+          include_metrics: true,
+          **options
+        )
-        # Capture api_metrics from ApiResponse wrapper (nil for pre-fetched first_response)
         last_api_metrics = response.api_metrics if response.respond_to?(:api_metrics)
         log(:debug, "stop_reason=#{response["stop_reason"]} content_types=#{(response["content"] || []).map { |b| b["type"] }.join(",")}")
         if response["stop_reason"] == "tool_use"
-          tool_results = execute_tools(response, registry, session_id)
-          promoted = promote_between_rounds(between_rounds)
-          # Dual injection: user messages go as text blocks within the current
-          # tool_results turn (same speaker); sub-agent messages append as
-          # separate assistant→user turn pairs (distinct tool invocations).
-          promoted[:texts].each { |text| tool_results << {type: "text", text: text} }
+          tool_results = execute_tools(response, registry)
           messages += [
             {role: "assistant", content: response["content"]},
             {role: "user", content: tool_results}
           ]
-          messages.concat(promoted[:pairs])
-          return nil if handle_interrupt!(session_id)
         else
-          # Discard the text response if the user pressed Escape while
-          # the API was generating it. Without this check the interrupt
-          # flag set during the blocking API call would be silently
-          # cleared by the ensure block in AgentRequestJob.
-          return nil if handle_interrupt!(session_id)
           return {text: extract_text(response), api_metrics: last_api_metrics}
         end
       end
@@ -119,26 +96,12 @@ module LLM
     private
-    # Invokes the between_rounds callback and returns promoted messages
-    # split by injection strategy.
-    #
-    # @param between_rounds [#call, nil] callback returning
-    #   +{texts: Array<String>, pairs: Array<Hash>}+
-    # @return [Hash{Symbol => Array}] +:texts+ for user messages (text blocks
-    #   in current tool_results), +:pairs+ for sub-agent messages (separate
-    #   conversation turns)
-    def promote_between_rounds(between_rounds)
-      return {texts: [], pairs: []} unless between_rounds
-      between_rounds.call
-    end
     def build_provider(provider)
       provider || Providers::Anthropic.new
     end
     def extract_text(response)
       content = response["content"] || []
       content
         .select { |block| block["type"] == "text" }
         .map { |block| block["text"] }
@@ -150,157 +113,36 @@ module LLM
       content.select { |block| block["type"] == "tool_use" }
     end
-    # Executes all tool_use blocks from a response, emitting events for each.
-    # Checks for user interrupt between tools — remaining tools receive
-    # synthetic results to satisfy the Anthropic API's tool_use/tool_result
-    # pairing requirement (a missing result permanently breaks the conversation).
-    #
-    # @param response [Hash] Anthropic API response with tool_use content blocks
-    # @param registry [Tools::Registry] tool registry for dispatch
-    # @param session_id [Integer, String] session ID for events
-    # @return [Array<Hash>] tool_result content blocks for the next API call
-    def execute_tools(response, registry, session_id)
-      tool_uses = extract_tool_uses(response)
-      results = []
-      interrupted = false
-      tool_uses.each_with_index do |tool_use, index|
-        # Check-only here; clearing happens in handle_interrupt! after the loop
-        interrupted ||= interrupt_requested?(session_id)
-        if interrupted
-          remaining = tool_uses[index..]
-          results.concat(interrupt_remaining_tools(remaining, session_id)) if remaining&.any?
-          break
-        end
-        results << execute_single_tool(tool_use, registry, session_id)
-      end
-      results
-    end
-    # Creates synthetic "Your human wants your attention" results for all tools in the list.
-    #
-    # @param tool_uses [Array<Hash>] remaining tool_use content blocks
-    # @param session_id [Integer, String] session ID for events
-    # @return [Array<Hash>] tool_result content blocks
-    def interrupt_remaining_tools(tool_uses, session_id)
-      tool_uses.map { |tool_use| interrupt_tool(tool_use, session_id) }
+    # Executes every +tool_use+ block from the response and returns
+    # matching +tool_result+ blocks. Always emits a result — a missing
+    # result permanently corrupts the Anthropic conversation history.
+    def execute_tools(response, registry)
+      extract_tool_uses(response).map { |tool_use| execute_single_tool(tool_use, registry) }
     end
-    # Executes a single tool and always returns a tool_result — even if the
-    # tool raises. Per the Anthropic tool-use protocol, every tool_use must
-    # have a matching tool_result; a missing result permanently corrupts the
-    # conversation history and breaks the session.
-    #
-    # Falls back to SecureRandom.uuid when Anthropic omits the tool_use id,
-    # ensuring the ToolCall/ToolResponse pair always shares a valid identifier.
-    def execute_single_tool(tool_use, registry, session_id)
+    def execute_single_tool(tool_use, registry)
       name = tool_use["name"]
       id = tool_use["id"] || SecureRandom.uuid
       input = tool_use["input"] || {}
-      timeout = input["timeout"] || Anima::Settings.tool_timeout
       log(:debug, "tool_call: #{name}(#{input.to_json})")
-      broadcast_session_state(session_id, "tool_executing", tool: name)
-      Events::Bus.emit(Events::ToolCall.new(
-        content: "Calling #{name}", tool_name: name,
-        tool_input: input, tool_use_id: id, timeout: timeout,
-        session_id: session_id
-      ))
       result = registry.execute(name, input)
       result = ToolDecorator.call(name, result)
       result_content = format_tool_result(result)
       result_content = truncate_tool_result(result_content, registry, name)
-      log(:debug, "tool_result: #{name} → #{result_content.to_s.truncate(200)}")
-      Events::Bus.emit(Events::ToolResponse.new(
-        content: result_content, tool_name: name, tool_use_id: id,
-        success: !result.is_a?(Hash) || !result.key?(:error),
-        session_id: session_id
-      ))
+      log(:debug, "tool_result: #{name} → #{result_content.to_s.truncate(200)}")
       {type: "tool_result", tool_use_id: id, content: result_content}
     rescue => error
       error_detail = "#{error.class}: #{error.message}"
       Rails.logger.error("Tool #{name} raised #{error_detail}")
-      error_content = format_tool_result(error: error_detail)
-      # Emission can fail (e.g. encoding errors in ActionCable/SQLite),
-      # but losing the tool_result would permanently corrupt the session.
-      begin
-        Events::Bus.emit(Events::ToolResponse.new(
-          content: error_content, tool_name: name, tool_use_id: id,
-          success: false, session_id: session_id
-        ))
-      rescue => emit_error
-        Rails.logger.error("ToolResponse emission failed: #{emit_error.class}: #{emit_error.message}")
-      end
-      {type: "tool_result", tool_use_id: id, content: error_content}
-    end
-    # Creates a synthetic "Your human wants your attention" result for a tool that was not
-    # executed due to user interrupt. Emits both ToolCall and ToolResponse
-    # events so the TUI shows the interrupted tool in the event stream.
-    #
-    # @param tool_use [Hash] Anthropic tool_use content block
-    # @param session_id [Integer, String] session ID for events
-    # @return [Hash] tool_result content block
-    def interrupt_tool(tool_use, session_id)
-      name = tool_use["name"]
-      id = tool_use["id"] || SecureRandom.uuid
-      input = tool_use["input"] || {}
-      Events::Bus.emit(Events::ToolCall.new(
-        content: "Skipped #{name} — your human wants your attention", tool_name: name,
-        tool_input: input, tool_use_id: id, session_id: session_id
-      ))
-      Events::Bus.emit(Events::ToolResponse.new(
-        content: INTERRUPT_MESSAGE, tool_name: name, tool_use_id: id,
-        success: false, session_id: session_id
-      ))
-      {type: "tool_result", tool_use_id: id, content: INTERRUPT_MESSAGE}
-    end
-    # Checks whether the session has a pending interrupt flag.
-    #
-    # @param session_id [Integer, String] session to check
-    # @return [Boolean] true when interrupt is pending
-    def interrupt_requested?(session_id)
-      Session.where(id: session_id, interrupt_requested: true).exists?
-    end
-    # Atomically checks for a pending interrupt and clears it in one query.
-    # Used at loop boundaries (after tools, before LLM text return) to
-    # short-circuit the agent loop when the user presses Escape.
-    #
-    # @param session_id [Integer, String] session to check
-    # @return [Boolean] true when interrupt was detected and cleared
-    def handle_interrupt!(session_id)
-      Session.where(id: session_id, interrupt_requested: true)
-        .update_all(interrupt_requested: false) > 0
-    end
-    # Broadcasts a session state transition to all subscribed clients.
-    # Delegates to {Session#broadcast_session_state} which handles both
-    # the session's own stream and the parent's stream for HUD updates.
-    #
-    # @param session_id [Integer, String] session to broadcast for
-    # @param state [String] one of "idle", "llm_generating", "tool_executing", "interrupting"
-    # @param tool [String, nil] tool name when state is "tool_executing"
-    # @return [void]
-    def broadcast_session_state(session_id, state, tool: nil)
-      Session.find_by(id: session_id)&.broadcast_session_state(state, tool: tool)
+      {type: "tool_result", tool_use_id: id, content: format_tool_result(error: error_detail)}
     end
     def log(level, message)
       return unless @logger
       @logger.public_send(level, message)
     end
@@ -308,8 +150,6 @@ module LLM
       result.is_a?(Hash) ? result.to_json : result.to_s
     end
-    # Applies head+tail truncation when a tool result exceeds the tool's
-    # configured character threshold. Skips tools that opt out (e.g. read).
     def truncate_tool_result(content, registry, tool_name)
       threshold = registry.truncation_threshold(tool_name)
       return content unless threshold

data/lib/mcp/client_manager.rb CHANGED Viewed

@@ -3,81 +3,76 @@
 require "mcp"
 module Mcp
-  # Manages MCP client connections and registers their tools with
-  # {Tools::Registry}. Each configured server (HTTP or stdio) gets
-  # a dedicated {MCP::Client} instance. Tool lists are fetched once
-  # during registration and cached in the registry — subsequent LLM
-  # turns reuse the same tool set without re-querying servers.
+  # Connects to MCP servers and registers their tools with
+  # {Tools::Registry}. Each configured server (HTTP or stdio) gets a
+  # dedicated {MCP::Client} instance, cached for the worker's
+  # lifetime. Connection failures are logged and skipped — a
+  # misconfigured or unavailable server does not prevent other servers
+  # or built-in tools from working.
   #
-  # Connection failures are logged and skipped — a misconfigured or
-  # unavailable server does not prevent other servers or built-in
-  # tools from working.
+  # Spawned stdio processes are reaped on worker exit via
+  # {Mcp::StdioTransport.cleanup_all}.
+  #
+  # The cache is built once on the first {#register_tools} call and
+  # never invalidated; edits to +mcp.toml+ require a worker restart.
   #
   # @example
-  #   manager = Mcp::ClientManager.new
-  #   manager.register_tools(registry)
+  #   Mcp::ClientManager.shared.register_tools(registry)
   class ClientManager
+    # Lazily-instantiated process-wide manager. Production code should
+    # call {.shared}; {.new} is reserved for tests and internal use.
+    # @return [Mcp::ClientManager]
+    def self.shared
+      @shared ||= new
+    end
     # @param config [Mcp::Config] injectable config for testing
     def initialize(config: Config.new(logger: Rails.logger))
       @config = config
     end
-    # Connects to all configured MCP servers and registers their tools
-    # in the given registry. Returns warnings for servers that failed
-    # to load so the caller can surface them to the user.
+    # Connects to every configured MCP server on first call, caches
+    # the resulting tool wrappers, and registers them in the given
+    # registry.
     #
     # @param registry [Tools::Registry] the registry to add tools to
-    # @return [Array<String>] warning messages for servers that failed
+    # @return [Array<String>] warning messages from configuration plus
+    #   any per-server load failures
     def register_tools(registry)
-      warnings = []
-      register_transport_tools(@config.http_servers, registry, warnings) { |server| build_http_client(server) }
-      register_transport_tools(@config.stdio_servers, registry, warnings) { |server| build_stdio_client(server) }
-      @config.warnings + warnings
+      load_servers if @wrappers.nil?
+      @wrappers.each { |wrapper| registry.register(wrapper) }
+      @config.warnings + @warnings
     end
     private
-    # Iterates server configs, builds a client for each via the block,
-    # and registers the server's tools. Failures are logged and collected.
-    #
-    # @param servers [Array<Hash>] server configs from {Mcp::Config}
-    # @param registry [Tools::Registry] registry to register tools in
-    # @param warnings [Array<String>] collects failure messages
-    # @yield [server] block that builds an {MCP::Client} for the server
-    def register_transport_tools(servers, registry, warnings)
+    def load_servers
+      @wrappers = []
+      @warnings = []
+      register_transport_tools(@config.http_servers) { |server| build_http_client(server) }
+      register_transport_tools(@config.stdio_servers) { |server| build_stdio_client(server) }
+    end
+    def register_transport_tools(servers)
       servers.each do |server|
         client = yield(server)
-        register_server_tools(server[:name], client, registry)
+        wrappers = client.tools.map { |mcp_tool|
+          Tools::McpTool.new(server_name: server[:name], mcp_client: client, mcp_tool: mcp_tool)
+        }
+        @wrappers.concat(wrappers)
+        Rails.logger.info("MCP: registered #{wrappers.size} tools from #{server[:name]}")
       rescue => error
         message = "MCP: failed to load tools from #{server[:name]}: #{error.message}"
         Rails.logger.warn(message)
-        warnings << message
+        @warnings << message
       end
     end
-    # Fetches tools from an MCP client and registers them with
-    # namespaced names in the registry.
-    #
-    # @param server_name [String] server name for tool namespacing
-    # @param client [MCP::Client] connected MCP client
-    # @param registry [Tools::Registry] registry to register tools in
-    def register_server_tools(server_name, client, registry)
-      count = client.tools.map { |mcp_tool|
-        Tools::McpTool.new(server_name: server_name, mcp_client: client, mcp_tool: mcp_tool)
-      }.each { |wrapper| registry.register(wrapper) }.size
-      Rails.logger.info("MCP: registered #{count} tools from #{server_name}")
-    end
-    # @param server [Hash] server config with +:url+ and +:headers+
-    # @return [MCP::Client]
     def build_http_client(server)
       transport = MCP::Client::HTTP.new(url: server[:url], headers: server[:headers])
       MCP::Client.new(transport: transport)
     end
-    # @param server [Hash] server config with +:command+, +:args+, +:env+
-    # @return [MCP::Client]
     def build_stdio_client(server)
       transport = StdioTransport.new(command: server[:command], args: server[:args], env: server[:env])
       MCP::Client.new(transport: transport)

data/lib/mcp/stdio_transport.rb CHANGED Viewed

@@ -115,8 +115,11 @@ module Mcp
       @wait_thread&.alive? || false
     end
+    # +pgroup: true+ so {#terminate_process} can group-signal the
+    # entire descendant tree — npm/npx wrappers leak their +node+
+    # children otherwise.
     def spawn_process
-      @stdin, @stdout, @wait_thread = Open3.popen2(@env, @command, *@args)
+      @stdin, @stdout, @wait_thread = Open3.popen2(@env, @command, *@args, pgroup: true)
       @stdin.set_encoding("UTF-8")
       @stdout.set_encoding("UTF-8")
       self.class.register(self)
@@ -164,14 +167,15 @@ module Mcp
       @stdout&.close rescue IOError # rubocop:disable Style/RescueModifier
     end
-    # Sends SIGTERM and waits up to 2 seconds for the process to exit.
-    # Falls back to SIGKILL if the process does not terminate in time.
+    # Sends SIGTERM to the process group; escalates to SIGKILL on the
+    # group after +GRACEFUL_SHUTDOWN_TIMEOUT+ seconds. Negative PID
+    # signals the whole group (see {#spawn_process}).
     def terminate_process
       return unless @wait_thread
       pid = @wait_thread.pid
       begin
-        Process.kill("TERM", pid)
+        Process.kill("TERM", -pid)
       rescue Errno::ESRCH, Errno::EPERM
         return
       end
@@ -181,7 +185,7 @@ module Mcp
         _, status = Process.wait2(pid, Process::WNOHANG)
         break if status
         if Process.clock_gettime(Process::CLOCK_MONOTONIC) > deadline
-          Process.kill("KILL", pid) rescue Errno::ESRCH # rubocop:disable Style/RescueModifier
+          Process.kill("KILL", -pid) rescue Errno::ESRCH # rubocop:disable Style/RescueModifier
           Process.wait(pid) rescue Errno::ECHILD # rubocop:disable Style/RescueModifier
           break
         end