RubyGems - scout-ai - Versions diffs - 0.2.0 → 1.0.0 - Mend

scout-ai 0.2.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (80)

checksums.yaml +4 -4
data/.vimproject +91 -10
data/Rakefile +1 -0
data/VERSION +1 -1
data/bin/scout-ai +2 -0
data/lib/scout/llm/agent/chat.rb +24 -0
data/lib/scout/llm/agent.rb +13 -13
data/lib/scout/llm/ask.rb +26 -16
data/lib/scout/llm/backends/bedrock.rb +129 -0
data/lib/scout/llm/backends/huggingface.rb +6 -21
data/lib/scout/llm/backends/ollama.rb +69 -36
data/lib/scout/llm/backends/openai.rb +85 -35
data/lib/scout/llm/backends/openwebui.rb +1 -1
data/lib/scout/llm/backends/relay.rb +3 -2
data/lib/scout/llm/backends/responses.rb +272 -0
data/lib/scout/llm/chat.rb +547 -0
data/lib/scout/llm/parse.rb +70 -13
data/lib/scout/llm/tools.rb +126 -5
data/lib/scout/llm/utils.rb +17 -10
data/lib/scout/model/base.rb +19 -0
data/lib/scout/model/python/base.rb +25 -0
data/lib/scout/model/python/huggingface/causal/next_token.rb +23 -0
data/lib/scout/model/python/huggingface/causal.rb +29 -0
data/lib/scout/model/python/huggingface/classification +0 -0
data/lib/scout/model/python/huggingface/classification.rb +50 -0
data/lib/scout/model/python/huggingface.rb +112 -0
data/lib/scout/model/python/torch/dataloader.rb +57 -0
data/lib/scout/model/python/torch/helpers.rb +84 -0
data/lib/scout/model/python/torch/introspection.rb +34 -0
data/lib/scout/model/python/torch/load_and_save.rb +47 -0
data/lib/scout/model/python/torch.rb +94 -0
data/lib/scout/model/util/run.rb +181 -0
data/lib/scout/model/util/save.rb +81 -0
data/lib/scout-ai.rb +3 -1
data/python/scout_ai/__init__.py +35 -0
data/python/scout_ai/__pycache__/__init__.cpython-310.pyc +0 -0
data/python/scout_ai/__pycache__/__init__.cpython-311.pyc +0 -0
data/python/scout_ai/__pycache__/huggingface.cpython-310.pyc +0 -0
data/python/scout_ai/__pycache__/huggingface.cpython-311.pyc +0 -0
data/python/scout_ai/__pycache__/util.cpython-310.pyc +0 -0
data/python/scout_ai/__pycache__/util.cpython-311.pyc +0 -0
data/python/scout_ai/atcold/__init__.py +0 -0
data/python/scout_ai/atcold/plot_lib.py +141 -0
data/python/scout_ai/atcold/spiral.py +27 -0
data/python/scout_ai/huggingface/data.py +48 -0
data/python/scout_ai/huggingface/eval.py +60 -0
data/python/scout_ai/huggingface/model.py +29 -0
data/python/scout_ai/huggingface/rlhf.py +83 -0
data/python/scout_ai/huggingface/train/__init__.py +34 -0
data/python/scout_ai/huggingface/train/__pycache__/__init__.cpython-310.pyc +0 -0
data/python/scout_ai/huggingface/train/__pycache__/next_token.cpython-310.pyc +0 -0
data/python/scout_ai/huggingface/train/next_token.py +315 -0
data/python/scout_ai/language_model.py +70 -0
data/python/scout_ai/util.py +32 -0
data/scout-ai.gemspec +130 -0
data/scout_commands/agent/ask +133 -15
data/scout_commands/agent/kb +15 -0
data/scout_commands/llm/ask +71 -12
data/scout_commands/llm/process +4 -2
data/test/data/cat.jpg +0 -0
data/test/scout/llm/agent/test_chat.rb +14 -0
data/test/scout/llm/backends/test_bedrock.rb +60 -0
data/test/scout/llm/backends/test_huggingface.rb +3 -3
data/test/scout/llm/backends/test_ollama.rb +48 -10
data/test/scout/llm/backends/test_openai.rb +96 -11
data/test/scout/llm/backends/test_responses.rb +115 -0
data/test/scout/llm/test_ask.rb +1 -0
data/test/scout/llm/test_chat.rb +214 -0
data/test/scout/llm/test_parse.rb +81 -2
data/test/scout/model/python/huggingface/causal/test_next_token.rb +59 -0
data/test/scout/model/python/huggingface/test_causal.rb +33 -0
data/test/scout/model/python/huggingface/test_classification.rb +30 -0
data/test/scout/model/python/test_base.rb +44 -0
data/test/scout/model/python/test_huggingface.rb +9 -0
data/test/scout/model/python/test_torch.rb +71 -0
data/test/scout/model/python/torch/test_helpers.rb +14 -0
data/test/scout/model/test_base.rb +117 -0
data/test/scout/model/util/test_save.rb +31 -0
metadata +72 -5
data/questions/coach +0 -2

data/lib/scout/llm/backends/openai.rb CHANGED

@@ -1,8 +1,6 @@
 require 'scout'
 require 'openai'
-require_relative '../parse'
-require_relative '../tools'
-require_relative '../utils'
+require_relative '../chat'
 module LLM
   module OpenAI
@@ -11,9 +9,44 @@ module LLM
       Object::OpenAI::Client.new(access_token:key, log_errors: log_errors, uri_base: url)
     end
+    def self.process_input(messages)
+      messages.collect do |message|
+        if message[:role] == 'function_call'
+          {role: 'assistant', tool_calls: [message[:content]]}
+        elsif message[:role] == 'function_call_output'
+          message[:content]
+        else
+          message
+        end
+      end.flatten
+    end
+    def self.process_response(response, &block)
+      Log.debug "Respose: #{Log.fingerprint response}"
+      raise Exception, response["error"] if response["error"]
+      message = response.dig("choices", 0, "message")
+      tool_calls = response.dig("choices", 0, "tool_calls") ||
+        response.dig("choices", 0, "message", "tool_calls")
+      if tool_calls && tool_calls.any?
+        LLM.call_tools tool_calls, &block
+      else
+        [message]
+      end
+    end
     def self.ask(question, options = {}, &block)
+      original_options = options.dup
-      client, url, key, model, log_errors = IndiferentHash.process_options options, :client, :url, :key, :model, :log_errors
+      messages = LLM.chat(question)
+      options = options.merge LLM.options messages
+      tools = LLM.tools messages
+      associations = LLM.associations messages
+      client, url, key, model, log_errors, return_messages, format = IndiferentHash.process_options options,
+        :client, :url, :key, :model, :log_errors, :return_messages, :format,
+        log_errors: true
       if client.nil?
         url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
@@ -23,45 +56,62 @@ module LLM
       if model.nil?
         url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
-        model ||= LLM.get_url_config(:model, url, :openai_ask, :ask, :openai, env: 'OPENAI_MODEL', default: "gpt-3.5-turbo")
+        model ||= LLM.get_url_config(:model, url, :openai_ask, :ask, :openai, env: 'OPENAI_MODEL', default: "gpt-4.1")
       end
-      role = IndiferentHash.process_options options, :role
-      messages = LLM.parse(question, role)
-      parameters = options.merge(model: model, messages: messages)
-      Log.debug "Calling client with parameters: #{Log.fingerprint parameters}"
-      response = client.chat(parameters: parameters)
-      Log.debug "Respose: #{Log.fingerprint response}"
-      message = response.dig("choices", 0, "message")
-      tool_calls = response.dig("choices", 0, "tool_calls") ||
-        response.dig("choices", 0, "message", "tool_calls")
+      #role = IndiferentHash.process_options options, :role
+      case format.to_sym
+      when :json, :json_object
+        options[:response_format] = {type: 'json_object'}
+      else
+        options[:response_format] = {type: format}
+      end if format
+      parameters = options.merge(model: model)
+      if tools.any? || associations.any?
+        parameters[:tools] = []
+        parameters[:tools] += tools.values.collect{|a| a.last } if tools
+        parameters[:tools] += associations.values.collect{|a| a.last } if associations
+        if not block_given?
+          block = Proc.new do |name,parameters|
+            IndiferentHash.setup parameters
+            if tools[name]
+              workflow = tools[name].first
+              jobname = parameters.delete :jobname
+              workflow.job(name, jobname, parameters).run
+            else
+              kb = associations[name].first
+              entities, reverse = IndiferentHash.process_options parameters, :entities, :reverse
+              if reverse
+                kb.parents(name, entities)
+              else
+                kb.children(name, entities)
+              end
+            end
+          end
+        end
+      end
-      parameters.delete :tool_choice
+      Log.low "Calling openai #{url}: #{Log.fingerprint parameters}}"
+      Log.debug LLM.print messages
-      while tool_calls && tool_calls.any?
-        messages << message
+      parameters[:messages] = LLM.tools_to_openai messages
-        cpus = Scout::Config.get :cpus, :tool_calling, default: 3
-        tool_calls.each do |tool_call|
-          response_message = LLM.tool_response(tool_call, &block)
-          messages << response_message
-        end
+      response = self.process_response client.chat(parameters: parameters), &block
-        parameters[:messages] = messages.compact
-        Log.debug "Calling client with parameters: #{Log.fingerprint parameters}"
-        response = client.chat( parameters: parameters)
-        Log.debug "Respose: #{Log.fingerprint response}"
+      res = if response.last[:role] == 'function_call_output'
+              response + self.ask(messages + response, original_options.except(:tool_choice).merge(return_messages: true, tools: parameters[:tools]), &block)
+            else
+              response
+            end
-        message = response.dig("choices", 0, "message")
-        tool_calls = response.dig("choices", 0, "tool_calls") ||
-          response.dig("choices", 0, "message", "tool_calls")
+      if return_messages
+        res
+      else
+        res.last['content']
       end
-      message.dig("content")
     end
     def self.embed(text, options = {})

data/lib/scout/llm/backends/openwebui.rb CHANGED

@@ -31,7 +31,7 @@ module LLM
       model ||= LLM.get_url_config(:model, url, :openai_ask, :ask, :openai, env: 'OPENWEBUI_MODEL')
       role = IndiferentHash.process_options options, :role
-      messages = LLM.parse(question, role)
+      messages = LLM.messages(question, role)
       parameters = options.merge(model: model, messages: messages)

data/lib/scout/llm/backends/relay.rb CHANGED

@@ -24,9 +24,10 @@ module LLM
     end
     def self.ask(question, options = {}, &block)
-      options[:question] = question
+      server = IndiferentHash.process_options options, :server
+      server ||= Scout::Config.get :server, :ask_relay, :relay, :ask, env: 'ASK_ENDPOINT,LLM_ENDPOINT', default: :openai
-      server = Scout::Config.get(:server, :relay, default: "localhost")
+      options[:question] = question
       TmpFile.with_file(options.to_json) do |file|
         id = upload(server, file)
         gather(server, id)

data/lib/scout/llm/backends/responses.rb ADDED

@@ -0,0 +1,272 @@
+require_relative 'openai'
+module LLM
+  module Responses
+    def self.encode_image(path)
+      path = path.find if Path === path
+      file_content = File.binread(path)  # Replace with your file name
+      case extension = path.split('.').last.downcase
+      when 'jpg', 'jpeg'
+        mime = "image/jpeg"
+      when 'png'
+        mime = "image/png"
+      else
+        mime = "image/extension"
+      end
+      base64_image = Base64.strict_encode64(file_content)
+      "data:#{mime};base64,#{base64_image}"
+    end
+    def self.encode_pdf(path)
+      file_content = File.binread(path)  # Replace with your file name
+      Base64.strict_encode64(file_content)
+    end
+    def self.tool_response(tool_call, &block)
+      tool_call_id = tool_call.dig("id").sub(/^fc_/, '')
+      function_name = tool_call.dig("function", "name")
+      function_arguments = tool_call.dig("function", "arguments")
+      function_arguments = JSON.parse(function_arguments, { symbolize_names: true }) if String === function_arguments
+      IndiferentHash.setup function_arguments
+      function_response = block.call function_name, function_arguments
+      content = case function_response
+                when nil
+                  "success"
+                else
+                  function_response
+                end
+      content = content.to_s if Numeric === content
+    end
+    def self.tools_to_responses(messages)
+      messages.collect do |message|
+        if message[:role] == 'function_call'
+          info = JSON.parse(message[:content])
+          IndiferentHash.setup info
+          id = info[:id].sub(/^fc_/, '')
+          IndiferentHash.setup({
+            "type" => "function_call",
+            "status" => "completed",
+            "name" => info[:name],
+            "arguments" => (info[:arguments] || {}).to_json,
+            "call_id"=>"call_#{id}",
+          })
+        elsif message[:role] == 'function_call_output'
+          info = JSON.parse(message[:content])
+          IndiferentHash.setup info
+          id = info[:id].sub(/^fc_/, '')
+          {                               # append result message
+            "type" => "function_call_output",
+            "output" => info[:content],
+            "call_id"=>"call_#{id}",
+          }
+        else
+          message
+        end
+      end.flatten
+    end
+    def self.process_response(response, &block)
+      Log.debug "Respose: #{Log.fingerprint response}"
+      response['output'].collect do |output|
+        case output['type']
+        when 'message'
+          output['content'].collect do |content|
+            case content['type']
+            when 'output_text'
+              IndiferentHash.setup({role: 'assistant', content: content['text']})
+            end
+          end
+        when 'function_call'
+          LLM.call_tools [output], &block
+        when 'web_search_call'
+          next
+        else
+          eee output
+          raise
+        end
+      end.compact.flatten
+    end
+    def self.process_input(messages)
+      messages = self.tools_to_responses messages
+      messages.collect do |message|
+        IndiferentHash.setup(message)
+        if message[:role] == 'image'
+          path = message[:content]
+          if Open.remote?(path)
+            {role: :user, content: {type: :input_image, image_url: path }}
+          elsif Open.exists?(path)
+            path = self.encode_image(path)
+            {role: :user, content: [{type: :input_image, image_url: path }]}
+          else
+            raise
+          end
+        elsif message[:role] == 'pdf'
+          path = message[:content]
+          if Open.remote?(path)
+            {role: :user, content: {type: :input_file, file_url: path }}
+          elsif Open.exists?(path)
+            data = self.encode_pdf(path)
+            {role: :user, content: [{type: :input_file, file_data: data }]}
+          else
+            raise
+          end
+        elsif message[:role] == 'websearch'
+            {role: :tool, content: {type: "web_search_preview"} }
+        else
+          message
+        end
+      end.flatten
+    end
+    def self.ask(question, options = {}, &block)
+      original_options = options.dup
+      messages = LLM.chat(question)
+      options = options.merge LLM.options messages
+      tools = LLM.tools messages
+      associations = LLM.associations messages
+      client, url, key, model, log_errors, return_messages, format = IndiferentHash.process_options options,
+        :client, :url, :key, :model, :log_errors, :return_messages, :format,
+        log_errors: true
+      if client.nil?
+        url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
+        key ||= LLM.get_url_config(:key, url, :openai_ask, :ask, :openai, env: 'OPENAI_KEY')
+        client = LLM::OpenAI.client url, key, log_errors
+      end
+      if model.nil?
+        url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
+        model ||= LLM.get_url_config(:model, url, :openai_ask, :ask, :openai, env: 'OPENAI_MODEL', default: "gpt-4.1")
+      end
+      case format
+      when :json, :json_object, "json", "json_object"
+        options['text'] = {format: {type: 'json_object'}}
+      when String, Symbol
+        options['text'] = {format: {type: format}}
+      when Hash
+        if format.include?('format')
+          options['text'] = format
+        elsif format['type'] == 'json_schema'
+          options['text'] = {format: format}
+        else
+          options['text'] = {format: {name: "response_schema",
+                                      type: "json_schema",
+                                      additionalProperties: false,
+                                      required: format['properties'].keys,
+                                      schema: format,
+          }}
+        end
+      end if format
+      parameters = options.merge(model: model)
+      if tools.any? || associations.any?
+        parameters[:tools] ||= []
+        parameters[:tools] += tools.values.collect{|a| a.last } if tools
+        parameters[:tools] += associations.values.collect{|a| a.last } if associations
+        parameters[:tools] = parameters[:tools].collect{|tool|
+          function = tool.delete :function;
+          tool.merge function
+        }
+        if not block_given?
+          block = Proc.new do |name,parameters|
+            IndiferentHash.setup parameters
+            if tools[name]
+              workflow = tools[name].first
+              jobname = parameters.delete :jobname
+              workflow.job(name, jobname, parameters).run
+            else
+              kb = associations[name].first
+              entities, reverse = IndiferentHash.process_options parameters, :entities, :reverse
+              if reverse
+                kb.parents(name, entities)
+              else
+                kb.children(name, entities)
+              end
+            end
+          end
+        end
+      end
+      Log.low "Calling client with parameters #{Log.fingerprint parameters}\n#{LLM.print messages}"
+      messages = self.process_input messages
+      input = []
+      messages.each do |message|
+        parameters[:tools] ||= []
+        if message[:role].to_s == 'tool'
+          parameters[:tools] << message[:content]
+        else
+          input << message
+        end
+      end
+      parameters[:input] = input
+      response = client.responses.create(parameters: parameters)
+      response = self.process_response response, &block
+      res = if response.last[:role] == 'function_call_output'
+              response + self.ask(messages + response, original_options.except(:tool_choice).merge(return_messages: true, tools: parameters[:tools]), &block)
+            else
+              response
+            end
+      if return_messages
+        res
+      else
+        res.last['content']
+      end
+    end
+  end
+  def self.image(question, options = {}, &block)
+    original_options = options.dup
+    messages = LLM.chat(question)
+    options = options.merge LLM.options messages
+    tools = LLM.tools messages
+    associations = LLM.associations messages
+    client, url, key, model, log_errors, return_messages, format = IndiferentHash.process_options options,
+      :client, :url, :key, :model, :log_errors, :return_messages, :format,
+      log_errors: true
+    if client.nil?
+      url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
+      key ||= LLM.get_url_config(:key, url, :openai_ask, :ask, :openai, env: 'OPENAI_KEY')
+      client = LLM::OpenAI.client url, key, log_errors
+    end
+    if model.nil?
+      url ||= Scout::Config.get(:url, :openai_ask, :ask, :openai, env: 'OPENAI_URL')
+      model ||= LLM.get_url_config(:model, url, :openai_ask, :ask, :openai, env: 'OPENAI_MODEL', default: "gpt-image-1")
+    end
+    messages = self.process_input messages
+    input = []
+    messages.each do |message|
+      parameters[:tools] ||= []
+      if message[:role].to_s == 'tool'
+        parameters[:tools] << message[:content]
+      else
+        input << message
+      end
+    end
+    parameters[:prompt] = LLM.print(input)
+    response = client.images.generate(parameters: parameters)
+    response[0]['b64_json']
+  end
+end