boxcars 0.7.7 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (57)
  1. checksums.yaml +4 -4
  2. data/.rubocop.yml +6 -3
  3. data/.ruby-version +1 -1
  4. data/Gemfile +3 -13
  5. data/Gemfile.lock +29 -25
  6. data/POSTHOG_TEST_README.md +118 -0
  7. data/README.md +305 -0
  8. data/boxcars.gemspec +1 -2
  9. data/lib/boxcars/boxcar/active_record.rb +9 -10
  10. data/lib/boxcars/boxcar/calculator.rb +2 -2
  11. data/lib/boxcars/boxcar/engine_boxcar.rb +4 -4
  12. data/lib/boxcars/boxcar/google_search.rb +2 -2
  13. data/lib/boxcars/boxcar/json_engine_boxcar.rb +1 -1
  14. data/lib/boxcars/boxcar/ruby_calculator.rb +1 -1
  15. data/lib/boxcars/boxcar/sql_base.rb +4 -4
  16. data/lib/boxcars/boxcar/swagger.rb +3 -3
  17. data/lib/boxcars/boxcar/vector_answer.rb +3 -3
  18. data/lib/boxcars/boxcar/xml_engine_boxcar.rb +1 -1
  19. data/lib/boxcars/boxcar.rb +6 -6
  20. data/lib/boxcars/conversation_prompt.rb +3 -3
  21. data/lib/boxcars/engine/anthropic.rb +121 -23
  22. data/lib/boxcars/engine/cerebras.rb +2 -2
  23. data/lib/boxcars/engine/cohere.rb +135 -9
  24. data/lib/boxcars/engine/gemini_ai.rb +151 -76
  25. data/lib/boxcars/engine/google.rb +2 -2
  26. data/lib/boxcars/engine/gpt4all_eng.rb +92 -34
  27. data/lib/boxcars/engine/groq.rb +124 -73
  28. data/lib/boxcars/engine/intelligence_base.rb +52 -17
  29. data/lib/boxcars/engine/ollama.rb +127 -47
  30. data/lib/boxcars/engine/openai.rb +186 -103
  31. data/lib/boxcars/engine/perplexityai.rb +116 -136
  32. data/lib/boxcars/engine/together.rb +2 -2
  33. data/lib/boxcars/engine/unified_observability.rb +430 -0
  34. data/lib/boxcars/engine.rb +4 -3
  35. data/lib/boxcars/engines.rb +74 -0
  36. data/lib/boxcars/observability.rb +44 -0
  37. data/lib/boxcars/observability_backend.rb +17 -0
  38. data/lib/boxcars/observability_backends/multi_backend.rb +42 -0
  39. data/lib/boxcars/observability_backends/posthog_backend.rb +89 -0
  40. data/lib/boxcars/observation.rb +8 -8
  41. data/lib/boxcars/prompt.rb +16 -4
  42. data/lib/boxcars/result.rb +7 -12
  43. data/lib/boxcars/ruby_repl.rb +1 -1
  44. data/lib/boxcars/train/train_action.rb +1 -1
  45. data/lib/boxcars/train/xml_train.rb +3 -3
  46. data/lib/boxcars/train/xml_zero_shot.rb +1 -1
  47. data/lib/boxcars/train/zero_shot.rb +3 -3
  48. data/lib/boxcars/train.rb +1 -1
  49. data/lib/boxcars/vector_search.rb +5 -5
  50. data/lib/boxcars/vector_store/pgvector/build_from_array.rb +116 -88
  51. data/lib/boxcars/vector_store/pgvector/build_from_files.rb +106 -80
  52. data/lib/boxcars/vector_store/pgvector/save_to_database.rb +148 -122
  53. data/lib/boxcars/vector_store/pgvector/search.rb +157 -131
  54. data/lib/boxcars/vector_store.rb +4 -4
  55. data/lib/boxcars/version.rb +1 -1
  56. data/lib/boxcars.rb +31 -20
  57. metadata +11 -21
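
The headline change in 0.8.0 is the observability layer: unified_observability.rb, observability.rb, the backend files, and the PostHog test README are all new, and every engine hunk below follows the same wiring. The schematic below shows that shape; the mixin name and the track_ai_generation keyword arguments are taken from the hunks in this diff, while the engine class itself is purely illustrative:

    module Boxcars
      # Schematic only: how the engines below wire into the new observability
      # layer. MyEngine and its body are illustrative, not real Boxcars code.
      class MyEngine < Engine
        include UnifiedObservability

        def client(prompt:, inputs: {}, **kwargs)
          start_time = Time.now
          response_data = { response_obj: nil, parsed_json: nil, success: false, error: nil, status_code: nil }
          # ... provider-specific call goes here, filling response_data ...
        ensure
          track_ai_generation(
            duration_ms: ((Time.now - start_time) * 1000).round,
            current_params: kwargs,
            request_context: { prompt:, inputs: },
            response_data:,
            provider: :my_engine
          )
        end
      end
    end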
data/lib/boxcars/engine/cohere.rb
@@ -4,6 +4,7 @@
 module Boxcars
   # A engine that uses Cohere's API.
   class Cohere < Engine
+    include UnifiedObservability
     attr_reader :prompts, :llm_params, :model_kwargs, :batch_size

     # The default parameters to use when asking the engine.
@@ -29,7 +30,7 @@ module Boxcars
       @llm_params = DEFAULT_PARAMS.merge(kwargs)
       @prompts = prompts
       @batch_size = 20
-      super(description: description, name: name)
+      super(description:, name:)
     end

     def conversation_model?(_model)
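
The rewritten super call uses Ruby 3.1's hash/keyword value omission (description: expands to description: description), which is presumably related to the .ruby-version bump in this release. A standalone illustration of the shorthand:

    # Ruby 3.1+ value omission: `name:` is shorthand for `name: name`.
    def label(name:, color: "red")
      "#{name} (#{color})"
    end

    name = "boxcar"
    color = "blue"
    label(name:, color:) # => "boxcar (blue)"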
@@ -59,20 +60,45 @@ module Boxcars
     #   Defaults to Boxcars.configuration.cohere_api_key.
     # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
     def client(prompt:, inputs: {}, **kwargs)
-      api_key = Boxcars.configuration.cohere_api_key(**kwargs)
-      params = prompt.as_prompt(inputs: inputs, prefixes: default_prefixes, show_roles: true).merge(llm_params.merge(kwargs))
-      params[:message] = params.delete(:prompt)
-      params[:stop_sequences] = params.delete(:stop) if params.key?(:stop)
-      Boxcars.debug("Prompt after formatting:#{params[:message]}", :cyan) if Boxcars.configuration.log_prompts
-      chat(params, api_key)
+      start_time = Time.now
+      response_data = { response_obj: nil, parsed_json: nil, success: false, error: nil, status_code: nil }
+      current_params = llm_params.merge(kwargs)
+      current_prompt_object = prompt.is_a?(Array) ? prompt.first : prompt
+      api_request_params = nil
+
+      begin
+        api_key = Boxcars.configuration.cohere_api_key(**kwargs)
+        api_request_params = current_prompt_object.as_prompt(inputs:, prefixes: default_prefixes,
+                                                             show_roles: true).merge(current_params)
+        api_request_params[:message] = api_request_params.delete(:prompt)
+        api_request_params[:stop_sequences] = api_request_params.delete(:stop) if api_request_params.key?(:stop)
+
+        Boxcars.debug("Prompt after formatting:#{api_request_params[:message]}", :cyan) if Boxcars.configuration.log_prompts
+
+        raw_response = _cohere_api_call(api_request_params, api_key)
+        _process_cohere_response(raw_response, response_data)
+      rescue StandardError => e
+        _handle_cohere_error(e, response_data)
+      ensure
+        call_context = {
+          start_time:,
+          prompt_object: current_prompt_object,
+          inputs:,
+          api_request_params:,
+          current_params:
+        }
+        _track_cohere_observability(call_context, response_data)
+      end
+
+      _cohere_handle_call_outcome(response_data:)
     end

     # get an answer from the engine for a question.
     # @param question [String] The question to ask the engine.
     # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
-    def run(question, **kwargs)
+    def run(question, **)
       prompt = Prompt.new(template: question)
-      response = client(prompt: prompt, **kwargs)
+      response = client(prompt:, **)

       raise Error, "Cohere: No response from API" unless response
       raise Error, "Cohere: #{response[:error]}" if response[:error]
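
A subtlety in the rewritten client: rescue converts any exception into response_data state instead of letting it propagate, ensure then always fires the tracking call, and control falls through to _cohere_handle_call_outcome, which re-raises on the error path. The same control flow in miniature (do_request and record_event are hypothetical stand-ins):

    # Minimal sketch of the capture, track, re-raise flow used above.
    def timed_call
      start_time = Time.now
      response_data = { result: nil, success: false, error: nil }
      begin
        response_data[:result] = do_request # hypothetical provider call
        response_data[:success] = true
      rescue StandardError => e
        response_data[:error] = e # captured, not propagated (yet)
      ensure
        duration_ms = ((Time.now - start_time) * 1000).round
        record_event(duration_ms:, response_data:) # hypothetical tracker; runs on every path
      end
      raise response_data[:error] if response_data[:error] # re-raise only after tracking

      response_data[:result]
    end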
@@ -131,5 +157,105 @@ module Boxcars
     def default_prefixes
       { system: "SYSTEM: ", user: "USER: ", assistant: "CHATBOT: ", history: :history }
     end
+
+    private
+
+    # Make the actual API call to Cohere
+    def _cohere_api_call(params, api_key)
+      raise Boxcars::Error, 'Cohere API key not set' if api_key.blank?
+
+      # Define the API endpoint and parameters
+      api_endpoint = 'https://api.cohere.ai/v1/chat'
+
+      connection = Faraday.new(api_endpoint) do |faraday|
+        faraday.request :url_encoded
+        faraday.headers['Authorization'] = "Bearer #{api_key}"
+        faraday.headers['Content-Type'] = 'application/json'
+      end
+
+      # Make the API call
+      connection.post { |req| req.body = params.to_json }
+    end
+
+    # Process the raw response from Cohere API
+    def _process_cohere_response(raw_response, response_data)
+      response_data[:response_obj] = raw_response
+      response_data[:status_code] = raw_response.status
+
+      if raw_response.status == 200
+        parsed_json = JSON.parse(raw_response.body, symbolize_names: true)
+        response_data[:parsed_json] = parsed_json
+
+        if parsed_json[:error]
+          response_data[:success] = false
+          response_data[:error] = Boxcars::Error.new("Cohere API Error: #{parsed_json[:error]}")
+        else
+          response_data[:success] = true
+        end
+      else
+        response_data[:success] = false
+        response_data[:error] = Boxcars::Error.new("HTTP #{raw_response.status}: #{raw_response.reason_phrase}")
+      end
+    end
+
+    # Handle errors from Cohere API calls
+    def _handle_cohere_error(error, response_data)
+      response_data[:error] = error
+      response_data[:success] = false
+      response_data[:status_code] = error.respond_to?(:response) && error.response ? error.response[:status] : nil
+    end
+
+    # Track observability using the unified system
+    def _track_cohere_observability(call_context, response_data)
+      duration_ms = ((Time.now - call_context[:start_time]) * 1000).round
+      request_context = {
+        prompt: call_context[:prompt_object],
+        inputs: call_context[:inputs],
+        conversation_for_api: call_context[:api_request_params]
+      }

+      track_ai_generation(
+        duration_ms:,
+        current_params: call_context[:current_params],
+        request_context:,
+        response_data:,
+        provider: :cohere
+      )
+    end
+
+    # Handle the final outcome of the API call
+    def _cohere_handle_call_outcome(response_data:)
+      if response_data[:error]
+        _handle_cohere_error_outcome(response_data[:error])
+      elsif !response_data[:success]
+        _handle_cohere_response_body_error(response_data[:response_obj])
+      else
+        response_data[:parsed_json] # Return the raw parsed JSON
+      end
+    end
+
+    # Handle error outcomes
+    def _handle_cohere_error_outcome(error_data)
+      detailed_error_message = error_data.message
+      if error_data.respond_to?(:response) && error_data.response
+        detailed_error_message += " - Details: #{error_data.response[:body]}"
+      end
+      Boxcars.error("Cohere Error: #{detailed_error_message} (#{error_data.class.name})", :red)
+      raise error_data
+    end
+
+    # Handle response body errors
+    def _handle_cohere_response_body_error(response_obj)
+      msg = "Unknown error from Cohere API"
+      if response_obj.respond_to?(:body)
+        begin
+          parsed_body = JSON.parse(response_obj.body)
+          msg = parsed_body["message"] || parsed_body["error"] || msg
+        rescue JSON::ParserError
+          msg = "HTTP #{response_obj.status}: #{response_obj.reason_phrase}"
+        end
+      end
+      raise Error, msg
+    end
   end
 end
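
None of this changes the boxcar's public surface: client still returns the parsed JSON, and run still performs its error checks before returning. A usage sketch, assuming a Cohere API key is configured (for example via a COHERE_API_KEY environment variable resolved by Boxcars.configuration):

    # Usage sketch; assumes Boxcars.configuration.cohere_api_key resolves.
    engine = Boxcars::Cohere.new
    response = engine.run("What is the capital of France?")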
data/lib/boxcars/engine/gemini_ai.rb
@@ -1,118 +1,193 @@
 # frozen_string_literal: true

-# Boxcars is a framework for running a series of tools to get an answer to a question.
+require 'openai' # Gemini uses the OpenAI gem with a custom URI base
+require 'json'
+
 module Boxcars
-  # A engine that uses GeminiAI's API.
+  # A engine that uses GeminiAI's API via an OpenAI-compatible interface.
   class GeminiAi < Engine
-    attr_reader :prompts, :llm_parmas, :model_kwargs, :batch_size
+    include UnifiedObservability
+    attr_reader :prompts, :llm_params, :model_kwargs, :batch_size # Corrected typo llm_parmas to llm_params

-    # The default parameters to use when asking the engine.
     DEFAULT_PARAMS = {
-      model: "gemini-1.5-flash-latest",
+      model: "gemini-1.5-flash-latest", # Default model for Gemini
       temperature: 0.1
+      # max_tokens is often part of the request, not a fixed default here
     }.freeze
-
-    # the default name of the engine
     DEFAULT_NAME = "GeminiAI engine"
-    # the default description of the engine
-    DEFAULT_DESCRIPTION = "useful for when you need to use AI to answer questions. " \
+    DEFAULT_DESCRIPTION = "useful for when you need to use Gemini AI to answer questions. " \
                           "You should ask targeted questions"

-    # A engine is a container for a single tool to run.
-    # @param name [String] The name of the engine. Defaults to "GeminiAI engine".
-    # @param description [String] A description of the engine. Defaults to:
-    #   useful for when you need to use AI to answer questions. You should ask targeted questions".
-    # @param prompts [Array<String>] The prompts to use when asking the engine. Defaults to [].
-    # @param batch_size [Integer] The number of prompts to send to the engine at once. Defaults to 20.
     def initialize(name: DEFAULT_NAME, description: DEFAULT_DESCRIPTION, prompts: [], batch_size: 20, **kwargs)
-      @llm_parmas = DEFAULT_PARAMS.merge(kwargs)
+      @llm_params = DEFAULT_PARAMS.merge(kwargs) # Corrected typo here
       @prompts = prompts
       @batch_size = batch_size
-      super(description: description, name: name)
+      super(description:, name:)
     end

-    # Get the OpenAI API client
-    # @param gemini_api_key [String] The access token to use when asking the engine.
-    #   Defaults to Boxcars.configuration.gemini_api_key
-    # @return [OpenAI::Client] The OpenAI API gem client.
-    def self.open_ai_client(gemini_api_key: nil)
-      access_token = Boxcars.configuration.gemini_api_key(gemini_api_key: gemini_api_key)
-      ::OpenAI::Client.new(access_token: access_token, uri_base: "https://generativelanguage.googleapis.com/v1beta/openai/")
+    # Renamed from open_ai_client to gemini_client for clarity
+    def self.gemini_client(gemini_api_key: nil)
+      access_token = Boxcars.configuration.gemini_api_key(gemini_api_key:)
+      # NOTE: The OpenAI gem might not support `log_errors: true` for custom uri_base.
+      # It's a param for OpenAI::Client specific to their setup.
+      ::OpenAI::Client.new(access_token:, uri_base: "https://generativelanguage.googleapis.com/v1beta/")
+      # Removed /openai from uri_base as it's usually for OpenAI-specific paths on custom domains.
+      # The Gemini endpoint might be directly at /v1beta/models/gemini...:generateContent
+      # This might need adjustment based on how the OpenAI gem forms the full URL.
+      # For direct generateContent, a different client or HTTP call might be needed if OpenAI gem is too restrictive.
+      # Assuming for now it's an OpenAI-compatible chat endpoint.
     end

-    def conversation_model?(_model)
+    # Gemini models are typically conversational.
+    def conversation_model?(_model_name)
       true
     end

-    # Get an answer from the engine.
-    # @param prompt [String] The prompt to use when asking the engine.
-    # @param gemini_api_key [String] The access token to use when asking the engine.
-    #   Defaults to Boxcars.configuration.gemini_api_key.
-    # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
     def client(prompt:, inputs: {}, gemini_api_key: nil, **kwargs)
-      clnt = GeminiAi.open_ai_client(gemini_api_key: gemini_api_key)
-      params = llm_parmas.merge(kwargs)
-      prompt = prompt.first if prompt.is_a?(Array)
-      params = prompt.as_messages(inputs).merge(params)
-      if Boxcars.configuration.log_prompts
-        Boxcars.debug(params[:messages].last(2).map { |p| ">>>>>> Role: #{p[:role]} <<<<<<\n#{p[:content]}" }.join("\n"), :cyan)
+      start_time = Time.now
+      response_data = { response_obj: nil, parsed_json: nil, success: false, error: nil, status_code: nil }
+      current_params = @llm_params.merge(kwargs) # Use instance var @llm_params
+      api_request_params = nil
+      current_prompt_object = prompt.is_a?(Array) ? prompt.first : prompt
+
+      begin
+        clnt = GeminiAi.gemini_client(gemini_api_key:)
+        api_request_params = _prepare_gemini_request_params(current_prompt_object, inputs, current_params)
+
+        log_messages_debug(api_request_params[:messages]) if Boxcars.configuration.log_prompts && api_request_params[:messages]
+        _execute_and_process_gemini_call(clnt, api_request_params, response_data)
+      rescue ::OpenAI::Error => e # Catch OpenAI gem errors if they apply
+        response_data[:error] = e
+        response_data[:success] = false
+        response_data[:status_code] = e.http_status if e.respond_to?(:http_status)
+      rescue StandardError => e # Catch other errors
+        response_data[:error] = e
+        response_data[:success] = false
+      ensure
+        duration_ms = ((Time.now - start_time) * 1000).round
+        request_context = {
+          prompt: current_prompt_object,
+          inputs:,
+          conversation_for_api: api_request_params&.dig(:messages) || []
+        }
+        track_ai_generation(
+          duration_ms:,
+          current_params:,
+          request_context:,
+          response_data:,
+          provider: :gemini
+        )
       end
-      clnt.chat(parameters: params)
-    rescue => e
-      Boxcars.error(e, :red)
-      raise
+
+      _gemini_handle_call_outcome(response_data:)
     end

-    # get an answer from the engine for a question.
-    # @param question [String] The question to ask the engine.
-    # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
-    def run(question, **kwargs)
+    def run(question, **)
       prompt = Prompt.new(template: question)
-      response = client(prompt: prompt, **kwargs)
-      raise Error, "GeminiAI: No response from API" unless response
-
-      check_response(response)
-      response["choices"].map { |c| c.dig("message", "content") || c["text"] }.join("\n").strip
+      answer = client(prompt:, inputs: {}, **)
+      Boxcars.debug("Answer: #{answer}", :cyan)
+      answer
     end

-    # Get the default parameters for the engine.
     def default_params
-      llm_params
+      @llm_params # Use instance variable
     end

-    # make sure we got a valid response
-    # @param response [Hash] The response to check.
-    # @param must_haves [Array<String>] The keys that must be in the response. Defaults to %w[choices].
-    # @raise [KeyError] if there is an issue with the access token.
-    # @raise [ValueError] if the response is not valid.
-    def check_response(response, must_haves: %w[choices])
-      if response['error'].is_a?(Hash)
-        code = response.dig('error', 'code')
-        msg = response.dig('error', 'message') || 'unknown error'
-        raise KeyError, "GEMINI_API_TOKEN not valid" if code == 'invalid_api_key'
-
-        raise ValueError, "GeminiAI error: #{msg}"
+    private
+
+    def _execute_and_process_gemini_call(gemini_client_obj, prepared_api_params, current_response_data)
+      # The OpenAI gem's `chat` method might not work directly if Gemini's endpoint
+      # isn't perfectly OpenAI-compatible for chat completions.
+      # It might require calling a different method or using a more direct HTTP client.
+      # For this refactor, we'll assume `gemini_client_obj.chat` is the intended path.
+      raw_response = gemini_client_obj.chat(parameters: prepared_api_params)
+
+      current_response_data[:response_obj] = raw_response
+      current_response_data[:parsed_json] = raw_response # OpenAI gem returns Hash
+
+      if raw_response && !raw_response["error"] &&
+         (raw_response["choices"] || raw_response["candidates"]) # Combined check for OpenAI or Gemini success
+        current_response_data[:success] = true
+        current_response_data[:status_code] = 200 # Inferred
+      else
+        current_response_data[:success] = false
+        err_details = raw_response["error"] if raw_response
+        msg = if err_details
+                (err_details.is_a?(Hash) ? err_details['message'] : err_details).to_s
+              else
+                "Unknown Gemini API Error"
+              end
+        current_response_data[:error] = StandardError.new(msg)
       end
+    end
+
+    def _prepare_gemini_request_params(current_prompt, current_inputs, current_engine_params)
+      # Gemini typically uses a chat-like interface.
+      # Prepare messages for the API
+      # current_prompt.as_messages(current_inputs) returns a hash like { messages: [...] }
+      # We need to extract the array part for the OpenAI client's :messages parameter.
+      message_hash = current_prompt.as_messages(current_inputs)
+      # Ensure roles are 'user' and 'model' for Gemini if needed, or transform them.
+      # OpenAI gem expects 'system', 'user', 'assistant'. Adapter logic might be needed.
+      # For now, assume as_messages produces compatible roles or Gemini endpoint handles them.
+
+      # Gemini might not use 'model' in the same way in request body if using generateContent directly.
+      # If using OpenAI gem's chat method, it expects 'model' for routing.
+      # Let's assume api_request_params are for OpenAI gem's chat method.
+      { messages: message_hash[:messages] }.merge(current_engine_params)
+    end
+
+    def log_messages_debug(messages)
+      return unless messages.is_a?(Array)
+
+      Boxcars.debug(messages.last(2).map { |p| ">>>>>> Role: #{p[:role]} <<<<<<\n#{p[:content]}" }.join("\n"), :cyan)
+    end

-      must_haves.each do |key|
-        raise ValueError, "Expecting key #{key} in response" unless response.key?(key)
+    def _gemini_handle_call_outcome(response_data:)
+      if response_data[:error]
+        Boxcars.error("GeminiAI Error: #{response_data[:error].message} (#{response_data[:error].class.name})", :red)
+        raise response_data[:error]
+      elsif !response_data[:success]
+        err_details = response_data.dig(:response_obj, "error")
+        msg = if err_details
+                err_details.is_a?(Hash) ? "#{err_details['type']}: #{err_details['message']}" : err_details.to_s
+              else
+                "Unknown error from GeminiAI API"
+              end
+        raise Error, msg
+      else
+        _extract_content_from_gemini_response(response_data[:parsed_json])
       end
     end

-    # the engine type
-    def engine_type
-      "gemini_ai"
+    def _extract_content_from_gemini_response(parsed_json)
+      # Handle Gemini's specific response structure (candidates)
+      # or OpenAI-compatible structure if the endpoint behaves that way.
+      if parsed_json&.key?("candidates") # Native Gemini generateContent response
+        parsed_json["candidates"].map { |c| c.dig("content", "parts", 0, "text") }.join("\n").strip
+      elsif parsed_json&.key?("choices") # OpenAI-compatible response
+        parsed_json["choices"].map { |c| c.dig("message", "content") || c["text"] }.join("\n").strip
+      else
+        raise Error, "GeminiAI: Could not extract answer from response"
+      end
     end

-    # Calculate the maximum number of tokens possible to generate for a prompt.
-    # @param prompt_text [String] The prompt text to use.
-    # @return [Integer] the number of tokens possible to generate.
-    def max_tokens_for_prompt(prompt_text)
-      num_tokens = get_num_tokens(prompt_text)
+    # check_response method might be partially covered by _gemini_handle_call_outcome
+    # Retaining it if run method still uses it explicitly.
+    def check_response(response, must_haves: %w[choices candidates])
+      if response['error'].is_a?(Hash)
+        code = response.dig('error', 'code')
+        msg = response.dig('error', 'message') || 'unknown error'
+        # GEMINI_API_TOKEN is not standard, usually it's an API key.
+        # This check might need to align with actual error codes from Gemini.
+        raise KeyError, "Gemini API Key not valid or permission issue" if ['invalid_api_key', 'permission_denied'].include?(code)
+
+        raise ValueError, "GeminiAI error: #{msg}"
+      end

-      # get max context size for model by name
-      max_size = 8096
-      max_size - num_tokens
+      # Check for either 'choices' (OpenAI style) or 'candidates' (Gemini native style)
+      has_valid_content = must_haves.any? { |key| response.key?(key) && !response[key].empty? }
+      raise ValueError, "Expecting key like 'choices' or 'candidates' in response" unless has_valid_content
     end
   end
 end
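
The new _extract_content_from_gemini_response accepts both response shapes: Gemini's native candidates array and an OpenAI-compatible choices array. A self-contained illustration of the two digs on sample payloads:

    # Sample payloads in the two shapes handled by the extraction helper.
    native = { "candidates" => [{ "content" => { "parts" => [{ "text" => "Paris" }] } }] }
    openai = { "choices" => [{ "message" => { "content" => "Paris" } }] }

    native["candidates"].map { |c| c.dig("content", "parts", 0, "text") }.join("\n").strip # => "Paris"
    openai["choices"].map { |c| c.dig("message", "content") || c["text"] }.join("\n").strip # => "Paris"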
data/lib/boxcars/engine/google.rb
@@ -21,8 +21,8 @@ module Boxcars
     # @param prompts [Array<Prompt>] The prompts to use for the Engine.
     # @param batch_size [Integer] The number of prompts to send to the Engine at a time.
     # @param kwargs [Hash] Additional parameters to pass to the Engine.
-    def initialize(name: DEFAULT_NAME, description: DEFAULT_DESCRIPTION, prompts: [], batch_size: 20, **kwargs)
-      super(provider: :google, description: description, name: name, prompts: prompts, batch_size: batch_size, **kwargs)
+    def initialize(name: DEFAULT_NAME, description: DEFAULT_DESCRIPTION, prompts: [], batch_size: 20, **)
+      super(provider: :google, description:, name:, prompts:, batch_size:, **)
     end

     def default_model_params
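
This two-line change leans on Ruby 3.2's anonymous keyword-rest parameter: a bare ** in the signature can be forwarded as-is to another call, here combined with the value-omission shorthand for the named keywords. A minimal example of the forwarding:

    # Ruby 3.2+: anonymous `**` collects extra keywords and forwards them.
    def outer(name:, **)
      inner(name:, **)
    end

    def inner(name:, role: "engine")
      "#{name} (#{role})"
    end

    outer(name: "google", role: "search") # => "google (search)"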
data/lib/boxcars/engine/gpt4all_eng.rb
@@ -1,56 +1,114 @@
 # frozen_string_literal: true

 require 'gpt4all'
-# Boxcars is a framework for running a series of tools to get an answer to a question.
+require 'json' # For pretty_generate
+
 module Boxcars
   # A engine that uses local GPT4All API.
   class Gpt4allEng < Engine
-    attr_reader :prompts, :model_kwargs, :batch_size
+    include UnifiedObservability
+    attr_reader :prompts, :model_kwargs, :batch_size, :gpt4all_params # Added gpt4all_params

-    # the default name of the engine
     DEFAULT_NAME = "Gpt4all engine"
-    # the default description of the engine
     DEFAULT_DESCRIPTION = "useful for when you need to use local AI to answer questions. " \
                           "You should ask targeted questions"
+    # GPT4All doesn't have typical API params like temperature or model selection via params in the same way.
+    # Model is usually pre-loaded. We can add a placeholder for model_name if needed for tracking.
+    DEFAULT_PARAMS = {
+      model_name: "gpt4all-j-v1.3-groovy" # Example, actual model depends on local setup
+    }.freeze

-    # A engine is a container for a single tool to run.
-    # @param name [String] The name of the engine. Defaults to "OpenAI engine".
-    # @param description [String] A description of the engine. Defaults to:
-    #   useful for when you need to use AI to answer questions. You should ask targeted questions".
-    # @param prompts [Array<String>] The prompts to use when asking the engine. Defaults to [].
-    # @param batch_size [Integer] The number of prompts to send to the engine at once. Defaults to 2.
-    def initialize(name: DEFAULT_NAME, description: DEFAULT_DESCRIPTION, prompts: [], batch_size: 2, **_kwargs)
+    def initialize(name: DEFAULT_NAME, description: DEFAULT_DESCRIPTION, prompts: [], batch_size: 2, **kwargs)
+      @gpt4all_params = DEFAULT_PARAMS.merge(kwargs) # Store merged params
       @prompts = prompts
-      @batch_size = batch_size
-      super(description: description, name: name)
+      @batch_size = batch_size # Retain if used by other methods
+      super(description:, name:)
     end

-    # Get an answer from the engine.
-    # @param prompt [String] The prompt to use when asking the engine.
-    # @param openai_access_token [String] The access token to use when asking the engine.
-    #   Defaults to Boxcars.configuration.openai_access_token.
-    # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
-    def client(prompt:, inputs: {}, **_kwargs)
-      gpt4all = Gpt4all::ConversationalAI.new
-      gpt4all.prepare_resources(force_download: false)
-      gpt4all.start_bot
-      input_text = prompt.as_prompt(inputs: inputs)[:prompt]
-      Boxcars.debug("Prompt after formatting:\n#{input_text}", :cyan) if Boxcars.configuration.log_prompts
-      gpt4all.prompt(input_text)
-    rescue StandardError => e
-      Boxcars.error(["Error from gpt4all engine: #{e}", e.backtrace[-5..-1]].flatten.join("\n "))
-    ensure
-      gpt4all.stop_bot
+    def client(prompt:, inputs: {}, **kwargs)
+      start_time = Time.now
+      response_data = { response_obj: nil, parsed_json: nil, success: false, error: nil, status_code: nil }
+      # current_params are the effective parameters for this call, including defaults and overrides
+      current_params = @gpt4all_params.merge(kwargs)
+      # api_request_params for GPT4All is just the input text.
+      api_request_params = nil
+      current_prompt_object = prompt.is_a?(Array) ? prompt.first : prompt
+      gpt4all_instance = nil # To ensure it's in scope for ensure block
+
+      begin
+        gpt4all_instance = Gpt4all::ConversationalAI.new
+        # prepare_resources might download models, could take time.
+        # Consider if this setup should be outside the timed/tracked client call for long-running setup.
+        # For now, including it as it's part of the interaction.
+        gpt4all_instance.prepare_resources(force_download: false)
+        gpt4all_instance.start_bot
+
+        # GPT4All gem's prompt method takes a string.
+        prompt_text_for_api = current_prompt_object.as_prompt(inputs:)
+        prompt_text_for_api = prompt_text_for_api[:prompt] if prompt_text_for_api.is_a?(Hash) && prompt_text_for_api.key?(:prompt)
+        api_request_params = { prompt: prompt_text_for_api } # Store what's sent
+
+        Boxcars.debug("Prompt after formatting:\n#{prompt_text_for_api}", :cyan) if Boxcars.configuration.log_prompts
+
+        raw_response_text = gpt4all_instance.prompt(prompt_text_for_api) # Actual call
+
+        # GPT4All gem returns a string directly, or raises error.
+        response_data[:response_obj] = raw_response_text # Store the raw string
+        response_data[:parsed_json] = { "text" => raw_response_text } # Create a simple hash for consistency
+        response_data[:success] = true
+        response_data[:status_code] = 200 # Inferred for local success
+      rescue StandardError => e
+        response_data[:error] = e
+        response_data[:success] = false
+        # No HTTP status code for local errors typically, unless the gem provides one.
+      ensure
+        gpt4all_instance&.stop_bot # Ensure bot is stopped even if errors occur
+
+        duration_ms = ((Time.now - start_time) * 1000).round
+        request_context = {
+          prompt: current_prompt_object,
+          inputs:,
+          conversation_for_api: api_request_params&.dig(:prompt) # The text prompt
+        }
+
+        track_ai_generation(
+          duration_ms:,
+          current_params:,
+          request_context:,
+          response_data:,
+          provider: :gpt4all
+        )
+      end
+
+      _gpt4all_handle_call_outcome(response_data:)
     end

-    # get an answer from the engine for a question.
-    # @param question [String] The question to ask the engine.
-    # @param kwargs [Hash] Additional parameters to pass to the engine if wanted.
-    def run(question, **kwargs)
+    def run(question, **)
       prompt = Prompt.new(template: question)
-      answer = client(prompt: prompt, **kwargs)
+      answer = client(prompt:, inputs: {}, **)
       Boxcars.debug("Answer: #{answer}", :cyan)
       answer
     end
+
+    # Added for consistency
+    def default_params
+      @gpt4all_params
+    end
+
+    private
+
+    def _gpt4all_handle_call_outcome(response_data:)
+      if response_data[:error]
+        # The original code had a specific error logging format.
+        Boxcars.error(["Error from gpt4all engine: #{response_data[:error].message}",
+                       response_data[:error].backtrace&.first(5)&.join("\n ")].compact.join("\n "), :red)
+        raise response_data[:error]
+      elsif !response_data[:success]
+        # This case might be redundant if gpt4all gem always raises on error
+        raise Error, "Unknown error from Gpt4all"
+      else
+        response_data.dig(:parsed_json, "text") # Extract the text from our structured hash
+      end
+    end
   end
 end
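
Unlike the HTTP engines, Gpt4allEng drives a local model process, so the part worth internalizing is the lifecycle: the bot is created and started inside begin, and the safe-navigation call in ensure guarantees it is stopped even when preparation or prompting raises. The same lifecycle, reduced to the gpt4all gem calls that appear in this hunk:

    require 'gpt4all'

    # Lifecycle sketch using only the gpt4all calls shown above.
    bot = nil
    begin
      bot = Gpt4all::ConversationalAI.new
      bot.prepare_resources(force_download: false) # may download a model on first run
      bot.start_bot
      puts bot.prompt("Say hello in one word.")
    ensure
      bot&.stop_bot # stop the local process even if an earlier step raised
    end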