raix-openai-eight 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,346 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "active_support/concern"
4
+ require "active_support/core_ext/object/blank"
5
+ require "active_support/core_ext/string/filters"
6
+ require "open_router"
7
+ require "openai"
8
+
9
+ require_relative "message_adapters/base"
10
+
11
+ module Raix
12
+ class UndeclaredToolError < StandardError; end
13
+
14
+ # The `ChatCompletion` module is a Rails concern that provides a way to interact
15
+ # with the OpenRouter Chat Completion API via its client. The module includes a few
16
+ # methods that allow you to build a transcript of messages and then send them to
17
+ # the API for completion. The API will return a response that you can use however
18
+ # you see fit.
19
+ #
20
+ # When the AI responds with tool function calls instead of a text message, this
21
+ # module automatically:
22
+ # 1. Executes the requested tool functions
23
+ # 2. Adds the function results to the conversation transcript
24
+ # 3. Sends the updated transcript back to the AI for another completion
25
+ # 4. Repeats this process until the AI responds with a regular text message
26
+ #
27
+ # This automatic continuation ensures that tool calls are seamlessly integrated
28
+ # into the conversation flow. The AI can use tool results to formulate its final
29
+ # response to the user. You can limit the number of tool calls using the
30
+ # `max_tool_calls` parameter to prevent excessive function invocations.
31
+ #
32
+ # Tool functions must be defined on the class that includes this module. The
33
+ # `FunctionDispatch` module provides a Rails-like DSL for declaring these
34
+ # functions at the class level, which is cleaner than implementing them as
35
+ # instance methods.
36
+ #
37
+ # Note that some AI models can make multiple tool function calls in a single
38
+ # response. When that happens, the module executes all requested functions
39
+ # before continuing the conversation.
40
+ module ChatCompletion
41
+ extend ActiveSupport::Concern
42
+
43
    # Per-instance request options. Any value assigned here is used as the
    # default for the matching key in the params hash of the next
    # #chat_completion call (see that method for how each one is applied).
    # NOTE(review): `:loop` shadows Kernel#loop inside instances, and `:tools`
    # is overridden by FunctionDispatch#tools when that module is also
    # included — confirm both are intended.
    attr_accessor :cache_at, :frequency_penalty, :logit_bias, :logprobs, :loop, :min_p, :model, :presence_penalty,
                  :prediction, :repetition_penalty, :response_format, :stream, :temperature, :max_completion_tokens,
                  :max_tokens, :seed, :stop, :top_a, :top_k, :top_logprobs, :top_p, :tools, :available_tools, :tool_choice, :provider,
                  :max_tool_calls, :stop_tool_calls_and_respond
47
+
48
+ class_methods do
49
+ # Returns the current configuration of this class. Falls back to global configuration for unset values.
50
+ def configuration
51
+ @configuration ||= Configuration.new(fallback: Raix.configuration)
52
+ end
53
+
54
+ # Let's you configure the class-level configuration using a block.
55
+ def configure
56
+ yield(configuration)
57
+ end
58
+ end
59
+
60
    # Instance-level access to the class-level configuration (see the
    # class_methods block above).
    def configuration
      self.class.configuration
    end
64
+
65
+ # This method performs chat completion based on the provided transcript and parameters.
66
+ #
67
+ # @param params [Hash] The parameters for chat completion.
68
+ # @option loop [Boolean] :loop (false) DEPRECATED - The system now automatically continues after tool calls.
69
+ # @option params [Boolean] :json (false) Whether to return the parse the response as a JSON object. Will search for <json> tags in the response first, then fall back to the default JSON parsing of the entire response.
70
+ # @option params [String] :openai (nil) If non-nil, use OpenAI with the model specified in this param.
71
+ # @option params [Boolean] :raw (false) Whether to return the raw response or dig the text content.
72
+ # @option params [Array] :messages (nil) An array of messages to use instead of the transcript.
73
+ # @option tools [Array|false] :available_tools (nil) Tools to pass to the LLM. Ignored if nil (default). If false, no tools are passed. If an array, only declared tools in the array are passed.
74
+ # @option max_tool_calls [Integer] :max_tool_calls Maximum number of tool calls before forcing a text response. Defaults to the configured value.
75
+ # @return [String|Hash] The completed chat response.
76
+ def chat_completion(params: {}, loop: false, json: false, raw: false, openai: nil, save_response: true, messages: nil, available_tools: nil, max_tool_calls: nil)
77
+ # set params to default values if not provided
78
+ params[:cache_at] ||= cache_at.presence
79
+ params[:frequency_penalty] ||= frequency_penalty.presence
80
+ params[:logit_bias] ||= logit_bias.presence
81
+ params[:logprobs] ||= logprobs.presence
82
+ params[:max_completion_tokens] ||= max_completion_tokens.presence || configuration.max_completion_tokens
83
+ params[:max_tokens] ||= max_tokens.presence || configuration.max_tokens
84
+ params[:min_p] ||= min_p.presence
85
+ params[:prediction] = { type: "content", content: params[:prediction] || prediction } if params[:prediction] || prediction.present?
86
+ params[:presence_penalty] ||= presence_penalty.presence
87
+ params[:provider] ||= provider.presence
88
+ params[:repetition_penalty] ||= repetition_penalty.presence
89
+ params[:response_format] ||= response_format.presence
90
+ params[:seed] ||= seed.presence
91
+ params[:stop] ||= stop.presence
92
+ params[:temperature] ||= temperature.presence || configuration.temperature
93
+ params[:tool_choice] ||= tool_choice.presence
94
+ params[:tools] = if available_tools == false
95
+ nil
96
+ elsif available_tools.is_a?(Array)
97
+ filtered_tools(available_tools)
98
+ else
99
+ tools.presence
100
+ end
101
+ params[:top_a] ||= top_a.presence
102
+ params[:top_k] ||= top_k.presence
103
+ params[:top_logprobs] ||= top_logprobs.presence
104
+ params[:top_p] ||= top_p.presence
105
+
106
+ json = true if params[:response_format].is_a?(Raix::ResponseFormat)
107
+
108
+ if json
109
+ unless openai
110
+ params[:provider] ||= {}
111
+ params[:provider][:require_parameters] = true
112
+ end
113
+ if params[:response_format].blank?
114
+ params[:response_format] ||= {}
115
+ params[:response_format][:type] = "json_object"
116
+ end
117
+ end
118
+
119
+ # Deprecation warning for loop parameter
120
+ if loop
121
+ warn "\n\nWARNING: The 'loop' parameter is DEPRECATED and will be ignored.\nChat completions now automatically continue after tool calls until the AI provides a text response.\nUse 'max_tool_calls' to limit the number of tool calls (default: #{configuration.max_tool_calls}).\n\n"
122
+ end
123
+
124
+ # Set max_tool_calls from parameter or configuration default
125
+ self.max_tool_calls = max_tool_calls || configuration.max_tool_calls
126
+
127
+ # Reset stop_tool_calls_and_respond flag
128
+ @stop_tool_calls_and_respond = false
129
+
130
+ # Track tool call count
131
+ tool_call_count = 0
132
+
133
+ # set the model to the default if not provided
134
+ self.model ||= configuration.model
135
+
136
+ adapter = MessageAdapters::Base.new(self)
137
+
138
+ # duplicate the transcript to avoid race conditions in situations where
139
+ # chat_completion is called multiple times in parallel
140
+ # TODO: Defensive programming, ensure messages is an array
141
+ messages ||= transcript.flatten.compact
142
+ messages = messages.map { |msg| adapter.transform(msg) }.dup
143
+ raise "Can't complete an empty transcript" if messages.blank?
144
+
145
+ begin
146
+ response = if openai
147
+ openai_request(params:, model: openai, messages:)
148
+ else
149
+ openrouter_request(params:, model:, messages:)
150
+ end
151
+ retry_count = 0
152
+ content = nil
153
+
154
+ # no need for additional processing if streaming
155
+ return if stream && response.blank?
156
+
157
+ # tuck the full response into a thread local in case needed
158
+ Thread.current[:chat_completion_response] = response.with_indifferent_access
159
+
160
+ # TODO: add a standardized callback hook for usage events
161
+ # broadcast(:usage_event, usage_subject, self.class.name.to_s, response, premium?)
162
+
163
+ tool_calls = response.dig("choices", 0, "message", "tool_calls") || []
164
+ if tool_calls.any?
165
+ tool_call_count += tool_calls.size
166
+
167
+ # Check if we've exceeded max_tool_calls
168
+ if tool_call_count > self.max_tool_calls
169
+ # Add system message about hitting the limit
170
+ messages << { role: "system", content: "Maximum tool calls (#{self.max_tool_calls}) exceeded. Please provide a final response to the user without calling any more tools." }
171
+
172
+ # Force a final response without tools
173
+ params[:tools] = nil
174
+ response = if openai
175
+ openai_request(params:, model: openai, messages:)
176
+ else
177
+ openrouter_request(params:, model:, messages:)
178
+ end
179
+
180
+ # Process the final response
181
+ content = response.dig("choices", 0, "message", "content")
182
+ transcript << { assistant: content } if save_response
183
+ return raw ? response : content.strip
184
+ end
185
+
186
+ # Dispatch tool calls
187
+ tool_calls.each do |tool_call| # TODO: parallelize this?
188
+ # dispatch the called function
189
+ function_name = tool_call["function"]["name"]
190
+ arguments = JSON.parse(tool_call["function"]["arguments"].presence || "{}")
191
+ raise "Unauthorized function call: #{function_name}" unless self.class.functions.map { |f| f[:name].to_sym }.include?(function_name.to_sym)
192
+
193
+ dispatch_tool_function(function_name, arguments.with_indifferent_access)
194
+ end
195
+
196
+ # After executing tool calls, we need to continue the conversation
197
+ # to let the AI process the results and provide a text response.
198
+ # We continue until the AI responds with a regular assistant message
199
+ # (not another tool call request), unless stop_tool_calls_and_respond! was called.
200
+
201
+ # Use the updated transcript for the next call, not the original messages
202
+ updated_messages = transcript.flatten.compact
203
+ last_message = updated_messages.last
204
+
205
+ if !@stop_tool_calls_and_respond && (last_message[:role] != "assistant" || last_message[:tool_calls].present?)
206
+ # Send the updated transcript back to the AI
207
+ return chat_completion(
208
+ params:,
209
+ json:,
210
+ raw:,
211
+ openai:,
212
+ save_response:,
213
+ messages: nil, # Use transcript instead
214
+ available_tools:,
215
+ max_tool_calls: self.max_tool_calls - tool_call_count
216
+ )
217
+ elsif @stop_tool_calls_and_respond
218
+ # If stop_tool_calls_and_respond was set, force a final response without tools
219
+ params[:tools] = nil
220
+ response = if openai
221
+ openai_request(params:, model: openai, messages:)
222
+ else
223
+ openrouter_request(params:, model:, messages:)
224
+ end
225
+
226
+ content = response.dig("choices", 0, "message", "content")
227
+ transcript << { assistant: content } if save_response
228
+ return raw ? response : content.strip
229
+ end
230
+ end
231
+
232
+ response.tap do |res|
233
+ content = res.dig("choices", 0, "message", "content")
234
+
235
+ transcript << { assistant: content } if save_response
236
+ content = content.strip
237
+
238
+ if json
239
+ # Make automatic JSON parsing available to non-OpenAI providers that don't support the response_format parameter
240
+ content = content.match(%r{<json>(.*?)</json>}m)[1] if content.include?("<json>")
241
+
242
+ return JSON.parse(content)
243
+ end
244
+
245
+ return content unless raw
246
+ end
247
+ rescue JSON::ParserError => e
248
+ if e.message.include?("not a valid") # blank JSON
249
+ warn "Retrying blank JSON response... (#{retry_count} attempts) #{e.message}"
250
+ retry_count += 1
251
+ sleep 1 * retry_count # backoff
252
+ retry if retry_count < 3
253
+
254
+ raise e # just fail if we can't get content after 3 attempts
255
+ end
256
+
257
+ warn "Bad JSON received!!!!!!: #{content}"
258
+ raise e
259
+ rescue Faraday::BadRequestError => e
260
+ # make sure we see the actual error message on console or Honeybadger
261
+ warn "Chat completion failed!!!!!!!!!!!!!!!!: #{e.response[:body]}"
262
+ raise e
263
+ end
264
+ end
265
+
266
+ # This method returns the transcript array.
267
+ # Manually add your messages to it in the following abbreviated format
268
+ # before calling `chat_completion`.
269
+ #
270
+ # { system: "You are a pumpkin" },
271
+ # { user: "Hey what time is it?" },
272
+ # { assistant: "Sorry, pumpkins do not wear watches" }
273
+ #
274
+ # to add a function call use the following format:
275
+ # { function: { name: 'fancy_pants_function', arguments: { param: 'value' } } }
276
+ #
277
+ # to add a function result use the following format:
278
+ # { function: result, name: 'fancy_pants_function' }
279
+ #
280
+ # @return [Array] The transcript array.
281
+ def transcript
282
+ @transcript ||= []
283
+ end
284
+
285
+ # Dispatches a tool function call with the given function name and arguments.
286
+ # This method can be overridden in subclasses to customize how function calls are handled.
287
+ #
288
+ # @param function_name [String] The name of the function to call
289
+ # @param arguments [Hash] The arguments to pass to the function
290
+ # @param cache [ActiveSupport::Cache] Optional cache object
291
+ # @return [Object] The result of the function call
292
+ def dispatch_tool_function(function_name, arguments, cache: nil)
293
+ public_send(function_name, arguments, cache)
294
+ end
295
+
296
+ private
297
+
298
+ def filtered_tools(tool_names)
299
+ return nil if tool_names.blank?
300
+
301
+ requested_tools = tool_names.map(&:to_sym)
302
+ available_tool_names = tools.map { |tool| tool.dig(:function, :name).to_sym }
303
+
304
+ undeclared_tools = requested_tools - available_tool_names
305
+ raise UndeclaredToolError, "Undeclared tools: #{undeclared_tools.join(", ")}" if undeclared_tools.any?
306
+
307
+ tools.select { |tool| requested_tools.include?(tool.dig(:function, :name).to_sym) }
308
+ end
309
+
310
+ def openai_request(params:, model:, messages:)
311
+ if params[:prediction]
312
+ params.delete(:max_completion_tokens)
313
+ else
314
+ params[:max_completion_tokens] ||= params[:max_tokens]
315
+ params.delete(:max_tokens)
316
+ end
317
+
318
+ params[:stream] ||= stream.presence
319
+ params[:stream_options] = { include_usage: true } if params[:stream]
320
+
321
+ params.delete(:temperature) if model.start_with?("o")
322
+
323
+ configuration.openai_client.chat(parameters: params.compact.merge(model:, messages:))
324
+ end
325
+
326
+ def openrouter_request(params:, model:, messages:)
327
+ # max_completion_tokens is not supported by OpenRouter
328
+ params.delete(:max_completion_tokens)
329
+
330
+ retry_count = 0
331
+
332
+ begin
333
+ configuration.openrouter_client.complete(messages, model:, extras: params.compact, stream:)
334
+ rescue OpenRouter::ServerError => e
335
+ if e.message.include?("retry")
336
+ warn "Retrying OpenRouter request... (#{retry_count} attempts) #{e.message}"
337
+ retry_count += 1
338
+ sleep 1 * retry_count # backoff
339
+ retry if retry_count < 5
340
+ end
341
+
342
+ raise e
343
+ end
344
+ end
345
+ end
346
+ end
@@ -0,0 +1,71 @@
1
+ # frozen_string_literal: true
2
+
3
module Raix
  # The Configuration class holds the configuration options for the Raix gem.
  # Instances may be chained via a fallback configuration: any attribute that
  # has no truthy local value is read from the fallback instead.
  class Configuration
    # Defines a reader/writer pair where the reader consults the fallback
    # configuration when no local value has been assigned.
    #
    # NOTE: a locally assigned +false+ falls through to the fallback, because
    # the lookup tests truthiness rather than "defined".
    def self.attr_accessor_with_fallback(method_name)
      # Delegate to the private helper so the fallback-lookup logic lives in
      # one place (previously this body duplicated get_with_fallback, which
      # was dead code).
      define_method(method_name) do
        get_with_fallback(method_name)
      end
      define_method("#{method_name}=") do |value|
        instance_variable_set("@#{method_name}", value)
      end
    end

    # The temperature option determines the randomness of the generated text.
    # Higher values result in more random output.
    attr_accessor_with_fallback :temperature

    # The max_tokens option determines the maximum number of tokens to generate.
    attr_accessor_with_fallback :max_tokens

    # The max_completion_tokens option determines the maximum number of tokens to generate.
    attr_accessor_with_fallback :max_completion_tokens

    # The model option determines the model to use for text generation. This option
    # is normally set in each class that includes the ChatCompletion module.
    attr_accessor_with_fallback :model

    # The openrouter_client option determines the default client to use for communication.
    attr_accessor_with_fallback :openrouter_client

    # The openai_client option determines the OpenAI client to use for communication.
    attr_accessor_with_fallback :openai_client

    # The max_tool_calls option determines the maximum number of tool calls
    # before forcing a text response to prevent excessive function invocations.
    attr_accessor_with_fallback :max_tool_calls

    DEFAULT_MAX_TOKENS = 1000
    DEFAULT_MAX_COMPLETION_TOKENS = 16_384
    DEFAULT_MODEL = "meta-llama/llama-3.3-8b-instruct:free"
    DEFAULT_TEMPERATURE = 0.0
    DEFAULT_MAX_TOOL_CALLS = 25

    # Initializes a new instance of the Configuration class with default values.
    #
    # @param fallback [Configuration, nil] configuration consulted for values
    #   that have not been set on this instance (note the client accessors are
    #   the only ones without local defaults here)
    def initialize(fallback: nil)
      self.temperature = DEFAULT_TEMPERATURE
      self.max_completion_tokens = DEFAULT_MAX_COMPLETION_TOKENS
      self.max_tokens = DEFAULT_MAX_TOKENS
      self.model = DEFAULT_MODEL
      self.max_tool_calls = DEFAULT_MAX_TOOL_CALLS
      self.fallback = fallback
    end

    private

    attr_accessor :fallback

    # Returns the locally assigned (truthy) value for +method+, otherwise the
    # fallback configuration's value, or nil when there is no fallback.
    def get_with_fallback(method)
      value = instance_variable_get("@#{method}")
      return value if value
      return unless fallback

      fallback.public_send(method)
    end
  end
end
@@ -0,0 +1,132 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "securerandom"
4
+ module Raix
5
+ # Provides declarative function definition for ChatCompletion classes.
6
+ #
7
+ # Example:
8
+ #
9
+ # class MeaningOfLife
10
+ # include Raix::ChatCompletion
11
+ # include Raix::FunctionDispatch
12
+ #
13
+ # function :ask_deep_thought do
14
+ # wait 236_682_000_000_000
15
+ # "The meaning of life is 42"
16
+ # end
17
+ #
18
+ # def initialize
19
+ # transcript << { user: "What is the meaning of life?" }
20
+ # chat_completion
21
+ # end
22
+ # end
23
+ module FunctionDispatch
24
+ extend ActiveSupport::Concern
25
+
26
+ class_methods do
27
+ attr_reader :functions
28
+
29
+ # Defines a function that can be dispatched by the ChatCompletion module while
30
+ # processing the response from an AI model.
31
+ #
32
+ # Declaring a function here will automatically add it (in JSON Schema format) to
33
+ # the list of tools provided to the OpenRouter Chat Completion API. The function
34
+ # will be dispatched by name, so make sure the name is unique. The function's block
35
+ # argument will be executed in the instance context of the class that includes this module.
36
+ #
37
+ # Example:
38
+ # function :google_search, "Search Google for something", query: { type: "string" } do |arguments|
39
+ # GoogleSearch.new(arguments[:query]).search
40
+ # end
41
+ #
42
+ # @param name [Symbol] The name of the function.
43
+ # @param description [String] An optional description of the function.
44
+ # @param parameters [Hash] The parameters that the function accepts.
45
+ # @param block [Proc] The block of code to execute when the function is called.
46
+ def function(name, description = nil, **parameters, &block)
47
+ @functions ||= []
48
+ @functions << begin
49
+ {
50
+ name:,
51
+ parameters: { type: "object", properties: {}, required: [] }
52
+ }.tap do |definition|
53
+ definition[:description] = description if description.present?
54
+ parameters.each do |key, value|
55
+ value = value.dup
56
+ required = value.delete(:required)
57
+ optional = value.delete(:optional)
58
+ definition[:parameters][:properties][key] = value
59
+ if required || optional == false
60
+ definition[:parameters][:required] << key
61
+ end
62
+ end
63
+ definition[:parameters].delete(:required) if definition[:parameters][:required].empty?
64
+ end
65
+ end
66
+
67
+ define_method(name) do |arguments, cache|
68
+ id = SecureRandom.uuid[0, 23]
69
+
70
+ content = if cache.present?
71
+ cache.fetch([name, arguments]) do
72
+ instance_exec(arguments, &block)
73
+ end
74
+ else
75
+ instance_exec(arguments, &block)
76
+ end
77
+
78
+ # add in one operation to prevent race condition and potential wrong
79
+ # interleaving of tool calls in multi-threaded environments
80
+ transcript << [
81
+ {
82
+ role: "assistant",
83
+ content: nil,
84
+ tool_calls: [
85
+ {
86
+ id:,
87
+ type: "function",
88
+ function: {
89
+ name:,
90
+ arguments: arguments.to_json
91
+ }
92
+ }
93
+ ]
94
+ },
95
+ {
96
+ role: "tool",
97
+ tool_call_id: id,
98
+ name:,
99
+ content: content.to_s
100
+ }
101
+ ]
102
+
103
+ # Return the content - ChatCompletion will automatically continue
104
+ # the conversation after tool execution to get a final response
105
+ content
106
+ end
107
+ end
108
+ end
109
+
110
    included do
      # Holds the keyword arguments from the most recent #chat_completion call
      # on this instance (captured by the override defined in this module).
      attr_accessor :chat_completion_args
    end
113
+
114
+ def chat_completion(**chat_completion_args)
115
+ self.chat_completion_args = chat_completion_args
116
+ super
117
+ end
118
+
119
+ # Stops the automatic continuation of chat completions after this function call.
120
+ # Useful when you want to halt processing within a function and force the AI
121
+ # to provide a text response without making additional tool calls.
122
+ def stop_tool_calls_and_respond!
123
+ @stop_tool_calls_and_respond = true
124
+ end
125
+
126
+ def tools
127
+ return [] unless self.class.functions
128
+
129
+ self.class.functions.map { |function| { type: "function", function: } }
130
+ end
131
+ end
132
+ end