RubyGems - raif - Versions diffs - 1.3.0 → 1.4.0 - Mend

raif 1.3.0 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130)

data/app/models/raif/llms/anthropic.rb CHANGED

@@ -3,6 +3,7 @@
 class Raif::Llms::Anthropic < Raif::Llm
   include Raif::Concerns::Llms::Anthropic::MessageFormatting
   include Raif::Concerns::Llms::Anthropic::ToolFormatting
+  include Raif::Concerns::Llms::Anthropic::ResponseToolCalls
   def perform_model_completion!(model_completion, &block)
     params = build_request_parameters(model_completion)
@@ -21,7 +22,7 @@ class Raif::Llms::Anthropic < Raif::Llm
 private
   def connection
-    @connection ||= Faraday.new(url: "https://api.anthropic.com/v1") do |f|
+    @connection ||= Faraday.new(url: "https://api.anthropic.com/v1", request: Raif.default_request_options) do |f|
       f.headers["x-api-key"] = Raif.config.anthropic_api_key
       f.headers["anthropic-version"] = "2023-06-01"
       f.request :json
@@ -64,6 +65,11 @@ private
     if supports_native_tool_use?
       tools = build_tools_parameter(model_completion)
       params[:tools] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        params[:tool_choice] = build_forced_tool_choice(tool_klass.tool_name)
+      end
     end
     params[:stream] = true if model_completion.stream_response?
@@ -92,24 +98,6 @@ private
     end
   end
-  def extract_response_tool_calls(resp)
-    return if resp&.dig("content").nil?
-    # Find any tool_use content blocks
-    tool_uses = resp&.dig("content")&.select do |content|
-      content["type"] == "tool_use"
-    end
-    return if tool_uses.blank?
-    tool_uses.map do |tool_use|
-      {
-        "name" => tool_use["name"],
-        "arguments" => tool_use["input"]
-      }
-    end
-  end
   def extract_citations(resp)
     return [] if resp&.dig("content").nil?

data/app/models/raif/llms/bedrock.rb CHANGED

@@ -3,6 +3,7 @@
 class Raif::Llms::Bedrock < Raif::Llm
   include Raif::Concerns::Llms::Bedrock::MessageFormatting
   include Raif::Concerns::Llms::Bedrock::ToolFormatting
+  include Raif::Concerns::Llms::Bedrock::ResponseToolCalls
   def perform_model_completion!(model_completion, &block)
     if Raif.config.aws_bedrock_model_name_prefix.present?
@@ -72,6 +73,11 @@ private
     if supports_native_tool_use?
       tools = build_tools_parameter(model_completion)
       params[:tool_config] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        params[:tool_config][:tool_choice] = build_forced_tool_choice(tool_klass.tool_name)
+      end
     end
     params
@@ -121,26 +127,6 @@ private
     end
   end
-  def extract_response_tool_calls(resp)
-    # Get the message from the response object
-    message = resp.output.message
-    return if message.content.nil?
-    # Find any tool_use blocks in the content array
-    tool_uses = message.content.select do |content|
-      content.respond_to?(:tool_use) && content.tool_use.present?
-    end
-    return if tool_uses.blank?
-    tool_uses.map do |content|
-      {
-        "name" => content.tool_use.name,
-        "arguments" => content.tool_use.input
-      }
-    end
-  end
   def streaming_chunk_handler(model_completion, &block)
     return unless model_completion.stream_response?

data/app/models/raif/llms/google.rb ADDED

@@ -0,0 +1,140 @@
+# frozen_string_literal: true
+class Raif::Llms::Google < Raif::Llm
+  include Raif::Concerns::Llms::Google::MessageFormatting
+  include Raif::Concerns::Llms::Google::ToolFormatting
+  include Raif::Concerns::Llms::Google::ResponseToolCalls
+  def perform_model_completion!(model_completion, &block)
+    params = build_request_parameters(model_completion)
+    endpoint = build_endpoint(model_completion)
+    response = connection.post(endpoint) do |req|
+      req.body = params
+      req.options.on_data = streaming_chunk_handler(model_completion, &block) if model_completion.stream_response?
+    end
+    unless model_completion.stream_response?
+      update_model_completion(model_completion, response.body)
+    end
+    model_completion
+  end
+private
+  def connection
+    @connection ||= Faraday.new(url: "https://generativelanguage.googleapis.com/v1beta") do |f|
+      f.headers["x-goog-api-key"] = Raif.config.google_api_key
+      f.request :json
+      f.response :json
+      f.response :raise_error
+    end
+  end
+  def build_endpoint(model_completion)
+    if model_completion.stream_response?
+      "models/#{model_completion.model_api_name}:streamGenerateContent?alt=sse"
+    else
+      "models/#{model_completion.model_api_name}:generateContent"
+    end
+  end
+  def streaming_response_type
+    Raif::StreamingResponses::Google
+  end
+  def update_model_completion(model_completion, response_json)
+    model_completion.raw_response = if model_completion.response_format_json?
+      extract_json_response(response_json)
+    else
+      extract_text_response(response_json)
+    end
+    model_completion.response_array = response_json&.dig("candidates", 0, "content", "parts")
+    model_completion.response_tool_calls = extract_response_tool_calls(response_json)
+    model_completion.citations = extract_citations(response_json)
+    model_completion.completion_tokens = response_json&.dig("usageMetadata", "candidatesTokenCount")
+    model_completion.prompt_tokens = response_json&.dig("usageMetadata", "promptTokenCount")
+    model_completion.total_tokens = response_json&.dig("usageMetadata", "totalTokenCount") ||
+      (model_completion.completion_tokens.to_i + model_completion.prompt_tokens.to_i)
+    model_completion.save!
+  end
+  def build_request_parameters(model_completion)
+    params = {
+      contents: model_completion.messages
+    }
+    if model_completion.system_prompt.present?
+      params[:system_instruction] = { parts: [{ text: model_completion.system_prompt }] }
+    end
+    params[:generationConfig] = build_generation_config(model_completion)
+    if supports_native_tool_use?
+      tools = build_tools_parameter(model_completion)
+      params[:tools] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        params[:toolConfig] = { functionCallingConfig: build_forced_tool_choice(tool_klass.tool_name) }
+      end
+    end
+    params
+  end
+  def build_generation_config(model_completion)
+    config = {}
+    temperature = model_completion.temperature || default_temperature
+    config[:temperature] = temperature.to_f if temperature.present?
+    max_tokens = model_completion.max_completion_tokens || default_max_completion_tokens
+    config[:maxOutputTokens] = max_tokens if max_tokens.present?
+    # Use native JSON schema support for structured output
+    if model_completion.response_format_json? && model_completion.json_response_schema.present?
+      config[:responseMimeType] = "application/json"
+      config[:responseSchema] = sanitize_schema_for_google(model_completion.json_response_schema)
+    end
+    config
+  end
+  def extract_text_response(resp)
+    parts = resp&.dig("candidates", 0, "content", "parts")
+    return if parts.blank?
+    parts.select { |p| p.key?("text") }.map { |p| p["text"] }.join
+  end
+  def extract_json_response(resp)
+    # Google AI supports native JSON schema output, so the response should be in the text field
+    extract_text_response(resp)
+  end
+  def extract_citations(resp)
+    # Google AI returns grounding metadata for search results
+    grounding_metadata = resp&.dig("candidates", 0, "groundingMetadata")
+    return [] if grounding_metadata.blank?
+    citations = []
+    # Extract from grounding chunks
+    grounding_chunks = grounding_metadata["groundingChunks"] || []
+    grounding_chunks.each do |chunk|
+      web = chunk["web"]
+      next unless web.present?
+      citations << {
+        "url" => Raif::Utils::HtmlFragmentProcessor.strip_tracking_parameters(web["uri"]),
+        "title" => web["title"]
+      }
+    end
+    citations.uniq { |citation| citation["url"] }
+  end
+end

data/app/models/raif/llms/open_ai_base.rb CHANGED

@@ -28,11 +28,25 @@ class Raif::Llms::OpenAiBase < Raif::Llm
 private
   def connection
-    @connection ||= Faraday.new(url: "https://api.openai.com/v1") do |f|
-      f.headers["Authorization"] = "Bearer #{Raif.config.open_ai_api_key}"
-      f.request :json
-      f.response :json
-      f.response :raise_error
+    @connection ||= begin
+      conn = Faraday.new(url: Raif.config.open_ai_base_url, request: Raif.default_request_options) do |f|
+        case Raif.config.open_ai_auth_header_style
+        when :bearer
+          f.headers["Authorization"] = "Bearer #{Raif.config.open_ai_api_key}"
+        when :api_key
+          f.headers["api-key"] = Raif.config.open_ai_api_key
+        else
+          raise Raif::Errors::InvalidConfigError,
+            "Raif.config.open_ai_auth_header_style must be either :bearer or :api_key"
+        end
+        f.request :json
+        f.response :json
+        f.response :raise_error
+      end
+      conn.params["api-version"] = Raif.config.open_ai_api_version if Raif.config.open_ai_api_version.present?
+      conn
     end
   end

data/app/models/raif/llms/open_ai_completions.rb CHANGED

@@ -3,6 +3,7 @@
 class Raif::Llms::OpenAiCompletions < Raif::Llms::OpenAiBase
   include Raif::Concerns::Llms::OpenAiCompletions::MessageFormatting
   include Raif::Concerns::Llms::OpenAiCompletions::ToolFormatting
+  include Raif::Concerns::Llms::OpenAiCompletions::ResponseToolCalls
 private
@@ -26,17 +27,6 @@ private
     )
   end
-  def extract_response_tool_calls(resp)
-    return if resp.dig("choices", 0, "message", "tool_calls").blank?
-    resp.dig("choices", 0, "message", "tool_calls").map do |tool_call|
-      {
-        "name" => tool_call["function"]["name"],
-        "arguments" => JSON.parse(tool_call["function"]["arguments"])
-      }
-    end
-  end
   def build_request_parameters(model_completion)
     formatted_system_prompt = format_system_prompt(model_completion)
@@ -60,6 +50,11 @@ private
     if supports_native_tool_use?
       tools = build_tools_parameter(model_completion)
       parameters[:tools] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        parameters[:tool_choice] = build_forced_tool_choice(tool_klass.tool_name)
+      end
     end
     if model_completion.stream_response?

data/app/models/raif/llms/open_ai_responses.rb CHANGED

@@ -3,6 +3,7 @@
 class Raif::Llms::OpenAiResponses < Raif::Llms::OpenAiBase
   include Raif::Concerns::Llms::OpenAiResponses::MessageFormatting
   include Raif::Concerns::Llms::OpenAiResponses::ToolFormatting
+  include Raif::Concerns::Llms::OpenAiResponses::ResponseToolCalls
 private
@@ -27,22 +28,6 @@ private
     )
   end
-  def extract_response_tool_calls(resp)
-    return if resp["output"].blank?
-    tool_calls = []
-    resp["output"].each do |output_item|
-      next unless output_item["type"] == "function_call"
-      tool_calls << {
-        "name" => output_item["name"],
-        "arguments" => JSON.parse(output_item["arguments"])
-      }
-    end
-    tool_calls.any? ? tool_calls : nil
-  end
   def extract_raw_response(resp)
     text_outputs = []
@@ -110,6 +95,11 @@ private
     if supports_native_tool_use?
       tools = build_tools_parameter(model_completion)
       parameters[:tools] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        parameters[:tool_choice] = build_forced_tool_choice(tool_klass.tool_name)
+      end
     end
     # Add response format if needed. Default will be { "type": "text" }

data/app/models/raif/llms/open_router.rb CHANGED

@@ -3,6 +3,7 @@
 class Raif::Llms::OpenRouter < Raif::Llm
   include Raif::Concerns::Llms::OpenAiCompletions::MessageFormatting
   include Raif::Concerns::Llms::OpenAiCompletions::ToolFormatting
+  include Raif::Concerns::Llms::OpenAiCompletions::ResponseToolCalls
   include Raif::Concerns::Llms::OpenAi::JsonSchemaValidation
   def perform_model_completion!(model_completion, &block)
@@ -23,7 +24,7 @@ class Raif::Llms::OpenRouter < Raif::Llm
 private
   def connection
-    @connection ||= Faraday.new(url: "https://openrouter.ai/api/v1") do |f|
+    @connection ||= Faraday.new(url: "https://openrouter.ai/api/v1", request: Raif.default_request_options) do |f|
       f.headers["Authorization"] = "Bearer #{Raif.config.open_router_api_key}"
       f.headers["HTTP-Referer"] = Raif.config.open_router_site_url if Raif.config.open_router_site_url.present?
       f.headers["X-Title"] = Raif.config.open_router_app_name if Raif.config.open_router_app_name.present?
@@ -85,6 +86,11 @@ private
       end
       params[:tools] = tools unless tools.blank?
+      if model_completion.tool_choice.present?
+        tool_klass = model_completion.tool_choice.constantize
+        params[:tool_choice] = build_forced_tool_choice(tool_klass.tool_name)
+      end
     end
     if model_completion.stream_response?
@@ -121,16 +127,4 @@ private
       extract_text_response(resp)
     end
   end
-  def extract_response_tool_calls(resp)
-    tool_calls = resp.dig("choices", 0, "message", "tool_calls")
-    return if tool_calls.blank?
-    tool_calls.map do |tool_call|
-      {
-        "name" => tool_call["function"]["name"],
-        "arguments" => JSON.parse(tool_call["function"]["arguments"])
-      }
-    end
-  end
 end

data/app/models/raif/model_completion.rb CHANGED

@@ -1,14 +1,68 @@
 # frozen_string_literal: true
+# == Schema Information
+#
+# Table name: raif_model_completions
+#
+#  id                        :bigint           not null, primary key
+#  available_model_tools     :jsonb            not null
+#  citations                 :jsonb
+#  completed_at              :datetime
+#  completion_tokens         :integer
+#  failed_at                 :datetime
+#  failure_error             :string
+#  failure_reason            :text
+#  llm_model_key             :string           not null
+#  max_completion_tokens     :integer
+#  messages                  :jsonb            not null
+#  model_api_name            :string           not null
+#  output_token_cost         :decimal(10, 6)
+#  prompt_token_cost         :decimal(10, 6)
+#  prompt_tokens             :integer
+#  raw_response              :text
+#  response_array            :jsonb
+#  response_format           :integer          default("text"), not null
+#  response_format_parameter :string
+#  response_tool_calls       :jsonb
+#  retry_count               :integer          default(0), not null
+#  source_type               :string
+#  started_at                :datetime
+#  stream_response           :boolean          default(FALSE), not null
+#  system_prompt             :text
+#  temperature               :decimal(5, 3)
+#  tool_choice               :string
+#  total_cost                :decimal(10, 6)
+#  total_tokens              :integer
+#  created_at                :datetime         not null
+#  updated_at                :datetime         not null
+#  response_id               :string
+#  source_id                 :bigint
+#
+# Indexes
+#
+#  index_raif_model_completions_on_completed_at  (completed_at)
+#  index_raif_model_completions_on_created_at    (created_at)
+#  index_raif_model_completions_on_failed_at     (failed_at)
+#  index_raif_model_completions_on_source        (source_type,source_id)
+#  index_raif_model_completions_on_started_at    (started_at)
+#
 class Raif::ModelCompletion < Raif::ApplicationRecord
   include Raif::Concerns::LlmResponseParsing
   include Raif::Concerns::HasAvailableModelTools
+  include Raif::Concerns::BooleanTimestamp
+  boolean_timestamp :started_at
+  boolean_timestamp :completed_at
+  boolean_timestamp :failed_at
   belongs_to :source, polymorphic: true, optional: true
   validates :llm_model_key, presence: true, inclusion: { in: ->{ Raif.available_llm_keys.map(&:to_s) } }
   validates :model_api_name, presence: true
+  # Scope to find completions that have response tool calls
+  scope :with_response_tool_calls, -> { where_json_not_blank(:response_tool_calls) }
   delegate :json_response_schema, to: :source, allow_nil: true
   before_save :set_total_tokens
@@ -41,6 +95,13 @@ class Raif::ModelCompletion < Raif::ApplicationRecord
     end
   end
+  def record_failure!(exception)
+    self.failed_at = Time.current
+    self.failure_error = exception.class.name
+    self.failure_reason = exception.message.truncate(255)
+    save!
+  end
 private
   def llm_config

data/app/models/raif/model_tool.rb CHANGED

@@ -3,7 +3,7 @@
 class Raif::ModelTool
   include Raif::Concerns::JsonSchemaDefinition
-  delegate :tool_name, :tool_description, :tool_arguments_schema, :example_model_invocation, to: :class
+  delegate :tool_name, :tool_description, :example_model_invocation, to: :class
   class << self
     # The description of the tool that will be provided to the model
@@ -76,8 +76,9 @@ class Raif::ModelTool
       false
     end
-    def invoke_tool(tool_arguments:, source:)
+    def invoke_tool(provider_tool_call_id:, tool_arguments:, source:)
       tool_invocation = Raif::ModelToolInvocation.new(
+        provider_tool_call_id: provider_tool_call_id,
         source: source,
         tool_type: name,
         tool_arguments: tool_arguments
@@ -96,4 +97,11 @@ class Raif::ModelTool
     end
   end
+  # Instance method to get the tool arguments schema
+  # For instance-dependent schemas, builds the schema with this instance as context
+  # For class-level schemas, returns the class-level schema
+  def tool_arguments_schema
+    schema_for_instance(:tool_arguments)
+  end
 end

data/app/models/raif/model_tool_invocation.rb CHANGED

@@ -1,5 +1,25 @@
 # frozen_string_literal: true
+# == Schema Information
+#
+# Table name: raif_model_tool_invocations
+#
+#  id                    :bigint           not null, primary key
+#  completed_at          :datetime
+#  failed_at             :datetime
+#  result                :jsonb            not null
+#  source_type           :string           not null
+#  tool_arguments        :jsonb            not null
+#  tool_type             :string           not null
+#  created_at            :datetime         not null
+#  updated_at            :datetime         not null
+#  provider_tool_call_id :string
+#  source_id             :bigint           not null
+#
+# Indexes
+#
+#  index_raif_model_tool_invocations_on_source  (source_type,source_id)
+#
 class Raif::ModelToolInvocation < Raif::ApplicationRecord
   belongs_to :source, polymorphic: true
@@ -22,14 +42,26 @@ class Raif::ModelToolInvocation < Raif::ApplicationRecord
     @tool ||= tool_type.constantize
   end
-  def as_llm_message
-    "Invoking tool: #{tool_name} with arguments: #{tool_arguments.to_json}"
+  # Returns tool call in the format expected by LLM message formatting
+  # @param assistant_message [String, nil] Optional assistant message accompanying the tool call
+  # @return [Hash] Hash representation for JSONB storage and LLM APIs
+  def as_tool_call_message(assistant_message: nil)
+    Raif::Messages::ToolCall.new(
+      provider_tool_call_id: provider_tool_call_id,
+      name: tool_name,
+      arguments: tool_arguments,
+      assistant_message: assistant_message
+    ).to_h
   end
-  def result_llm_message
-    return unless tool.respond_to?(:observation_for_invocation)
-    tool.observation_for_invocation(self)
+  # Returns tool result in the format expected by LLM message formatting
+  # @return [Hash] Hash representation for JSONB storage and LLM APIs
+  def as_tool_call_result_message
+    Raif::Messages::ToolCallResult.new(
+      provider_tool_call_id: provider_tool_call_id,
+      name: tool_name,
+      result: result
+    ).to_h
   end
   def to_partial_path

data/app/models/raif/model_tools/agent_final_answer.rb CHANGED

@@ -20,16 +20,11 @@ class Raif::ModelTools::AgentFinalAnswer < Raif::ModelTool
     def observation_for_invocation(tool_invocation)
       return "No answer provided" unless tool_invocation.result.present?
-      tool_invocation.result["final_answer"]
+      tool_invocation.result
     end
     def process_invocation(tool_invocation)
-      tool_invocation.update!(
-        result: {
-          final_answer: tool_invocation.tool_arguments["final_answer"]
-        }
-      )
+      tool_invocation.update!(result: tool_invocation.tool_arguments["final_answer"])
       tool_invocation.result
     end
   end

data/app/models/raif/model_tools/provider_managed/code_execution.rb CHANGED

@@ -2,4 +2,8 @@
 class Raif::ModelTools::ProviderManaged::CodeExecution < Raif::ModelTools::ProviderManaged::Base
+  tool_description do
+    "Utilizes the model provider's built-in code execution capabilities."
+  end
 end

data/app/models/raif/model_tools/provider_managed/image_generation.rb CHANGED

@@ -2,4 +2,8 @@
 class Raif::ModelTools::ProviderManaged::ImageGeneration < Raif::ModelTools::ProviderManaged::Base
+  tool_description do
+    "Utilizes the model provider's built-in image generation capabilities."
+  end
 end

data/app/models/raif/model_tools/provider_managed/web_search.rb CHANGED

@@ -2,4 +2,8 @@
 class Raif::ModelTools::ProviderManaged::WebSearch < Raif::ModelTools::ProviderManaged::Base
+  tool_description do
+    "Utilizes the model provider's built-in web search capabilities."
+  end
 end