llm.rb 0.4.2 → 0.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +132 -84
- data/lib/json/schema/array.rb +5 -0
- data/lib/json/schema/boolean.rb +4 -0
- data/lib/json/schema/integer.rb +23 -1
- data/lib/json/schema/leaf.rb +11 -0
- data/lib/json/schema/null.rb +4 -0
- data/lib/json/schema/number.rb +23 -1
- data/lib/json/schema/object.rb +6 -2
- data/lib/json/schema/string.rb +26 -1
- data/lib/json/schema/version.rb +2 -0
- data/lib/json/schema.rb +10 -10
- data/lib/llm/buffer.rb +28 -10
- data/lib/llm/chat.rb +26 -1
- data/lib/llm/core_ext/ostruct.rb +14 -8
- data/lib/llm/file.rb +6 -1
- data/lib/llm/function.rb +81 -0
- data/lib/llm/message.rb +46 -1
- data/lib/llm/providers/anthropic/format/completion_format.rb +73 -0
- data/lib/llm/providers/anthropic/format.rb +7 -33
- data/lib/llm/providers/anthropic/response_parser/completion_parser.rb +51 -0
- data/lib/llm/providers/anthropic/response_parser.rb +1 -9
- data/lib/llm/providers/anthropic.rb +4 -3
- data/lib/llm/providers/gemini/audio.rb +4 -4
- data/lib/llm/providers/gemini/files.rb +5 -4
- data/lib/llm/providers/gemini/format/completion_format.rb +54 -0
- data/lib/llm/providers/gemini/format.rb +28 -27
- data/lib/llm/providers/gemini/images.rb +9 -4
- data/lib/llm/providers/gemini/response_parser/completion_parser.rb +46 -0
- data/lib/llm/providers/gemini/response_parser.rb +13 -20
- data/lib/llm/providers/gemini.rb +3 -12
- data/lib/llm/providers/ollama/format/completion_format.rb +72 -0
- data/lib/llm/providers/ollama/format.rb +10 -30
- data/lib/llm/providers/ollama/response_parser/completion_parser.rb +42 -0
- data/lib/llm/providers/ollama/response_parser.rb +8 -11
- data/lib/llm/providers/ollama.rb +3 -11
- data/lib/llm/providers/openai/audio.rb +6 -6
- data/lib/llm/providers/openai/files.rb +3 -3
- data/lib/llm/providers/openai/format/completion_format.rb +81 -0
- data/lib/llm/providers/openai/format/respond_format.rb +69 -0
- data/lib/llm/providers/openai/format.rb +25 -58
- data/lib/llm/providers/openai/images.rb +4 -2
- data/lib/llm/providers/openai/response_parser/completion_parser.rb +55 -0
- data/lib/llm/providers/openai/response_parser/respond_parser.rb +56 -0
- data/lib/llm/providers/openai/response_parser.rb +8 -44
- data/lib/llm/providers/openai/responses.rb +10 -11
- data/lib/llm/providers/openai.rb +5 -16
- data/lib/llm/response/{output.rb → respond.rb} +2 -2
- data/lib/llm/response.rb +1 -1
- data/lib/llm/version.rb +1 -1
- data/lib/llm.rb +28 -0
- data/llm.gemspec +1 -0
- metadata +28 -3
data/lib/llm/buffer.rb
CHANGED
@@ -28,6 +28,22 @@ module LLM
       @completed.each { yield(_1) }
     end
 
+    ##
+    # Returns an array of unread messages
+    # @see LLM::Message#read?
+    # @see LLM::Message#read!
+    # @return [Array<LLM::Message>]
+    def unread
+      reject(&:read?)
+    end
+
+    ##
+    # Find a message (in descending order)
+    # @return [LLM::Message, nil]
+    def find(...)
+      reverse_each.find(...)
+    end
+
     ##
     # @param [[LLM::Message, Hash]] item
     # A message and its parameters
@@ -48,7 +64,7 @@ module LLM
     private
 
     def empty!
-      message, params, method = @pending
+      message, params, method = @pending.pop
       if method == :complete
         complete!(message, params)
       elsif method == :respond
@@ -59,24 +75,26 @@ module LLM
     end
 
     def complete!(message, params)
-      …
+      pendings = @pending.map { _1[0] }
+      messages = [*@completed, *pendings]
       completion = @provider.complete(
         message.content,
         message.role,
         **params.merge(messages:)
       )
-      @completed.concat([*…
+      @completed.concat([*pendings, message, completion.choices[0]])
       @pending.clear
     end
 
     def respond!(message, params)
-      …
-      …
-      …
-      …
-      …
-      )
-      @…
+      pendings = @pending.map { _1[0] }
+      input = [*pendings]
+      params = [
+        params.merge(input:),
+        @response ? {previous_response_id: @response.id} : {}
+      ].inject({}, &:merge!)
+      @response = @provider.responses.create(message.content, message.role, **params)
+      @completed.concat([*pendings, message, @response.outputs[0]])
       @pending.clear
     end
   end
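
Taken together, the buffer changes batch every pending message into a single request when a lazy conversation is first read, and the new `unread`/`find` helpers make it easier to consume what comes back. A minimal usage sketch, assuming llm.rb 0.5.0 and an OpenAI key (the prompts are illustrative):

```ruby
require "llm"

llm = LLM.openai(ENV["OPENAI_API_KEY"])
bot = LLM::Chat.new(llm).lazy

# In lazy mode nothing is sent yet: each chat() call is queued in @pending.
bot.chat "You are a terse assistant", :system
bot.chat "What is 2 + 2?", :user

# Reading the buffer triggers empty!, which pops the last pending entry
# and folds the earlier ones into a single complete() request.
bot.messages.each { |message| print "[#{message.role}] ", message.content, "\n" }

# New in 0.5.0: find searches newest-first, and unread skips
# messages that have been marked with read!.
reply = bot.messages.find(&:assistant?)
bot.messages.unread.each(&:read!)
```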
data/lib/llm/chat.rb
CHANGED
@@ -37,7 +37,7 @@ module LLM
       @provider = provider
       @params = params.merge!(model:, schema:)
       @lazy = false
-      @messages = []
+      @messages = [].extend(Array)
     end
 
     ##
@@ -108,14 +108,39 @@ module LLM
       @lazy
     end
 
+    ##
+    # @return [String]
     def inspect
       "#<#{self.class.name}:0x#{object_id.to_s(16)} " \
       "@provider=#{@provider.class}, @params=#{@params.inspect}, " \
       "@messages=#{@messages.inspect}, @lazy=#{@lazy.inspect}>"
     end
 
+    ##
+    # Returns an array of functions that have yet to be called
+    # @return [Array<LLM::Function>]
+    def functions
+      messages
+        .select(&:assistant?)
+        .flat_map(&:functions)
+        .reject(&:called?)
+    end
+
     private
 
+    ##
+    # @private
+    module Array
+      def find(...)
+        reverse_each.find(...)
+      end
+
+      def unread
+        reject(&:read?)
+      end
+    end
+    private_constant :Array
+
     def respond!(prompt, role, params)
       @provider.responses.create(
         prompt,
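
`Chat#functions` surfaces assistant tool calls that have not been executed yet. A sketch of the round trip it appears designed for, using `LLM::Function` (added later in this diff, see data/lib/llm/function.rb). The tool is hypothetical, the schema builder calls are an assumption based on the JSON::Schema changes listed above, and passing `tools:` through `Chat.new` assumes `@params` is forwarded with each request, as `Chat#initialize` suggests:

```ruby
require "llm"

# A hypothetical tool the model may call; args arrives as the parsed
# arguments object (an OpenStruct in the response parsers below).
multiply = LLM::Function.new("multiply") do |fn|
  fn.description "Multiply two integers"
  fn.params { |schema| schema.object(a: schema.integer.required, b: schema.integer.required) }
  fn.define { |args| args.a * args.b }
end

llm = LLM.openai(ENV["OPENAI_API_KEY"])
bot = LLM::Chat.new(llm, tools: [multiply]).lazy
bot.chat "What is 5 * 6?"

# Run every pending tool call and feed each LLM::Function::Return back
# into the conversation; the provider formats translate it into a
# tool-result message. NOTE: Message#functions resolves names through
# the LLM.functions registry, populated in data/lib/llm.rb (its 28
# added lines are not shown in this diff).
bot.functions.each { |fn| bot.chat fn.call }
```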
data/lib/llm/core_ext/ostruct.rb
CHANGED
@@ -8,17 +8,19 @@ class OpenStruct
     # obj = OpenStruct.from_hash(person: {name: 'John'})
     # obj.person.name # => 'John'
     # obj.person.class # => OpenStruct
-    # @param [Hash]
+    # @param [Hash, Array] obj
     # A Hash object
     # @return [OpenStruct]
-    # An OpenStruct object initialized by visiting `…
-    …
-    …
-    …
-    …
-    …
+    # An OpenStruct object initialized by visiting `obj` with recursion
+    def from_hash(obj)
+      case obj
+      when self then from_hash(obj.to_h)
+      when Array then obj.map { |v| from_hash(v) }
+      else
+        visited = {}
+        obj.each { visited[_1] = walk(_2) }
+        new(visited)
       end
-      new(visited_object)
     end
 
     private
@@ -34,4 +36,8 @@ class OpenStruct
     end
   end
   extend FromHash
+
+  def to_json(...)
+    to_h.to_json(...)
+  end
 end
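
The rewrite makes `from_hash` handle arrays of hashes, which is the shape tool-call payloads arrive in, and gives `OpenStruct` a `to_json` that serialises the underlying data rather than the struct itself. The behaviour the new code implies (assuming the core extension has been loaded via `require "llm"`):

```ruby
require "json"
require "llm" # loads the OpenStruct core extension shown above

# Arrays now map element-wise through from_hash.
list = OpenStruct.from_hash([{name: "a"}, {name: "b"}])
list.map(&:name) # => ["a", "b"]

# to_json delegates to to_h, so nested structs serialise as plain JSON.
obj = OpenStruct.from_hash(person: {name: "John"})
obj.person.name  # => "John"
obj.to_json      # => '{"person":{"name":"John"}}'
```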
data/lib/llm/file.rb
CHANGED
data/lib/llm/function.rb
ADDED
@@ -0,0 +1,81 @@
+# frozen_string_literal: true
+
+class LLM::Function
+  class Return < Struct.new(:id, :value)
+  end
+
+  ##
+  # Returns function arguments
+  # @return [Array, nil]
+  attr_accessor :arguments
+
+  ##
+  # Returns the function ID
+  # @return [String, nil]
+  attr_accessor :id
+
+  ##
+  # @param [String] name The function name
+  # @yieldparam [LLM::Function] self The function object
+  def initialize(name, &b)
+    @name = name
+    @schema = JSON::Schema.new
+    yield(self)
+  end
+
+  ##
+  # Set the function description
+  # @param [String] str The function description
+  # @return [void]
+  def description(str)
+    @description = str
+  end
+
+  ##
+  # @yieldparam [JSON::Schema] schema The schema object
+  # @return [void]
+  def params
+    @params = yield(@schema)
+  end
+
+  ##
+  # Set the function implementation
+  # @param [Proc] b The function implementation
+  # @return [void]
+  def define(&b)
+    @runner = b
+  end
+
+  ##
+  # Call the function
+  # @param [Array] args The arguments to pass to the function
+  # @return [Object] The result of the function call
+  def call
+    Return.new id, @runner.call(arguments)
+  ensure
+    @called = true
+  end
+
+  ##
+  # Returns true when a function has been called
+  # @return [Boolean]
+  def called?
+    @called
+  end
+
+  ##
+  # @return [Hash]
+  def format(provider)
+    case provider.class.to_s
+    when "LLM::Gemini"
+      {name: @name, description: @description, parameters: @params}.compact
+    when "LLM::Anthropic"
+      {name: @name, description: @description, input_schema: @params}.compact
+    else
+      {
+        type: "function", name: @name,
+        function: {name: @name, description: @description, parameters: @params}
+      }.compact
+    end
+  end
+end
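
A sketch of defining and exercising a function directly, with the provider hand-off simulated by hand. The weather tool is hypothetical, and the schema builder calls are an assumption based on the JSON::Schema changes listed at the top of this diff:

```ruby
require "llm"

weather = LLM::Function.new("weather") do |fn|
  fn.description "Returns a hard-coded temperature for a city"
  fn.params { |schema| schema.object(city: schema.string.required) }
  fn.define { |args| {city: args.city, temperature: 20} }
end

# A provider stamps id/arguments onto a copy of the function when the
# model requests a call (see LLM::Message#functions below); simulated here.
weather.id = "call_123"
weather.arguments = OpenStruct.new(city: "Berlin")

result = weather.call # => #<struct LLM::Function::Return id="call_123", value={...}>
weather.called?       # => true
```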
data/lib/llm/message.rb
CHANGED
@@ -64,12 +64,57 @@ module LLM
       role == "assistant" || role == "model"
     end
 
+    ##
+    # @return [Array<LLM::Function>]
+    def functions
+      @functions ||= tool_calls.map do |fn|
+        function = LLM.functions[fn.name].dup
+        function.tap { _1.id = fn.id }
+        function.tap { _1.arguments = fn.arguments }
+      end
+    end
+
+    ##
+    # @return [Boolean]
+    # Returns true when the message requests a function call
+    def tool_call?
+      tool_calls.any?
+    end
+
+    ##
+    # Returns true when the message is a system message
+    # @return [Boolean]
+    def system?
+      role == "system"
+    end
+
+    ##
+    # Marks the message as read
+    # @return [void]
+    def read!
+      @read = true
+    end
+
+    ##
+    # Returns true when the message has been read
+    # @return [Boolean]
+    def read?
+      @read
+    end
+
     ##
     # Returns a string representation of the message
     # @return [String]
     def inspect
       "#<#{self.class.name}:0x#{object_id.to_s(16)} " \
-      "…
+      "tool_call=#{tool_calls.any?} role=#{role.inspect} " \
+      "content=#{content.inspect}>"
+    end
+
+    private
+
+    def tool_calls
+      @tool_calls ||= OpenStruct.from_hash(@extra[:tool_calls] || [])
     end
   end
 end
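
These predicates tie the buffer and chat changes together. A short sketch of how they compose, continuing the lazy `bot` from the earlier sketches (and assuming the tool was registered in the LLM.functions registry, which data/lib/llm.rb populates outside this excerpt):

```ruby
reply = bot.messages.find(&:assistant?)

if reply.tool_call?
  # Message#functions duplicates each registered function and stamps it
  # with the provider-assigned id and arguments.
  reply.functions.each { |fn| p fn.call.value }
end

# Mark everything as consumed so unread returns an empty array next time.
bot.messages.unread.each(&:read!)
bot.messages.unread # => []
```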
data/lib/llm/providers/anthropic/format/completion_format.rb
ADDED
@@ -0,0 +1,73 @@
+# frozen_string_literal: true
+
+module LLM::Anthropic::Format
+  ##
+  # @private
+  class CompletionFormat
+    ##
+    # @param [LLM::Message, Hash] message
+    # The message to format
+    def initialize(message)
+      @message = message
+    end
+
+    ##
+    # Formats the message for the Anthropic chat completions API
+    # @return [Hash]
+    def format
+      catch(:abort) do
+        if Hash === message
+          {role: message[:role], content: format_content(message[:content])}
+        else
+          format_message
+        end
+      end
+    end
+
+    private
+
+    def format_message
+      if message.tool_call?
+        {role: message.role, content: message.extra[:original_tool_calls]}
+      else
+        {role: message.role, content: format_content(content)}
+      end
+    end
+
+    ##
+    # @param [String, URI] content
+    # The content to format
+    # @return [String, Hash]
+    # The formatted content
+    def format_content(content)
+      case content
+      when Hash
+        content.empty? ? throw(:abort, nil) : [content]
+      when Array
+        content.empty? ? throw(:abort, nil) : content.flat_map { format_content(_1) }
+      when URI
+        [{type: :image, source: {type: "url", url: content.to_s}}]
+      when LLM::File
+        if content.image?
+          [{type: :image, source: {type: "base64", media_type: content.mime_type, data: content.to_b64}}]
+        else
+          raise LLM::Error::PromptError, "The given object (an instance of #{content.class}) " \
+                                         "is not an image, and therefore not supported by the " \
+                                         "Anthropic API"
+        end
+      when String
+        [{type: :text, text: content}]
+      when LLM::Message
+        format_content(content.content)
+      when LLM::Function::Return
+        {type: "tool_result", tool_use_id: content.id, content: content.value}
+      else
+        raise LLM::Error::PromptError, "The given object (an instance of #{content.class}) " \
+                                       "is not supported by the Anthropic API"
+      end
+    end
+
+    def message = @message
+    def content = message.content
+  end
+end
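
For instance, a plain text message maps to Anthropic's content-block shape (illustrative, derived from `format_content` above):

```ruby
message = LLM::Message.new(:user, "Hello")
LLM::Anthropic::Format::CompletionFormat.new(message).format
# => {role: :user, content: [{type: :text, text: "Hello"}]}
```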
data/lib/llm/providers/anthropic/format.rb
CHANGED
@@ -4,49 +4,23 @@ class LLM::Anthropic
   ##
   # @private
   module Format
+    require_relative "format/completion_format"
+
     ##
     # @param [Array<LLM::Message>] messages
     # The messages to format
     # @return [Array<Hash>]
     def format(messages)
-      messages.…
-      …
-        {role: _1[:role], content: format_content(_1[:content])}
-      else
-        {role: _1.role, content: format_content(_1.content)}
-      end
+      messages.filter_map do
+        CompletionFormat.new(_1).format
       end
     end
 
     private
 
-    …
-    …
-    …
-    # @return [String, Hash]
-    # The formatted content
-    def format_content(content)
-      case content
-      when Array
-        content.flat_map { format_content(_1) }
-      when URI
-        [{type: :image, source: {type: "url", url: content.to_s}}]
-      when LLM::File
-        if content.image?
-          [{type: :image, source: {type: "base64", media_type: content.mime_type, data: content.to_b64}}]
-        else
-          raise LLM::Error::PromptError, "The given object (an instance of #{content.class}) " \
-                                         "is not an image, and therefore not supported by the " \
-                                         "Anthropic API"
-        end
-      when String
-        [{type: :text, text: content}]
-      when LLM::Message
-        format_content(content.content)
-      else
-        raise LLM::Error::PromptError, "The given object (an instance of #{content.class}) " \
-                                       "is not supported by the Anthropic API"
-      end
+    def format_tools(tools)
+      return {} unless tools
+      {tools: tools.map { _1.format(self) }}
     end
   end
 end
data/lib/llm/providers/anthropic/response_parser/completion_parser.rb
ADDED
@@ -0,0 +1,51 @@
+# frozen_string_literal: true
+
+module LLM::Anthropic::ResponseParser
+  ##
+  # @private
+  class CompletionParser
+    def initialize(body)
+      @body = OpenStruct.from_hash(body)
+    end
+
+    def format(response)
+      {
+        model:,
+        prompt_tokens:,
+        completion_tokens:,
+        total_tokens:,
+        choices: format_choices(response)
+      }
+    end
+
+    private
+
+    def format_choices(response)
+      texts.map.with_index do |choice, index|
+        extra = {index:, response:, tool_calls: format_tool_calls(tools), original_tool_calls: tools}
+        LLM::Message.new(role, choice.text, extra)
+      end
+    end
+
+    def format_tool_calls(tools)
+      (tools || []).filter_map do |tool|
+        tool = {
+          id: tool.id,
+          name: tool.name,
+          arguments: tool.input
+        }
+        OpenStruct.new(tool)
+      end
+    end
+
+    def body = @body
+    def role = body.role
+    def model = body.model
+    def prompt_tokens = body.usage.input_tokens
+    def completion_tokens = body.usage.output_tokens
+    def total_tokens = body.usage.total_tokens
+    def parts = body.content
+    def texts = parts.select { _1["type"] == "text" }
+    def tools = parts.select { _1["type"] == "tool_use" }
+  end
+end
data/lib/llm/providers/anthropic/response_parser.rb
CHANGED
@@ -17,15 +17,7 @@ class LLM::Anthropic
     # The response body from the LLM provider
     # @return [Hash]
     def parse_completion(body)
-      {
-        model: body["model"],
-        choices: body["content"].map do
-          # TODO: don't hardcode role
-          LLM::Message.new("assistant", _1["text"], {response: self})
-        end,
-        prompt_tokens: body.dig("usage", "input_tokens"),
-        completion_tokens: body.dig("usage", "output_tokens")
-      }
+      CompletionParser.new(body).format(self)
    end
  end
 end
data/lib/llm/providers/anthropic.rb
CHANGED
@@ -7,6 +7,7 @@ module LLM
   class Anthropic < Provider
     require_relative "anthropic/error_handler"
     require_relative "anthropic/response_parser"
+    require_relative "anthropic/response_parser/completion_parser"
     require_relative "anthropic/format"
     require_relative "anthropic/models"
     include Format
@@ -49,11 +50,11 @@ module LLM
     # @raise [LLM::Error::PromptError]
     # When given an object a provider does not understand
     # @return (see LLM::Provider#complete)
-    def complete(prompt, role = :user, model: default_model, max_tokens: 1024, **params)
-      params = {max_tokens:, model:}.merge!(params)
+    def complete(prompt, role = :user, model: default_model, max_tokens: 1024, tools: nil, **params)
+      params = [{max_tokens:, model:}, format_tools(tools), params].inject({}, &:merge!).compact
      req = Net::HTTP::Post.new("/v1/messages", headers)
      messages = [*(params.delete(:messages) || []), Message.new(role, prompt)]
-      body = JSON.dump({messages: format(messages)}.merge!(params))
+      body = JSON.dump({messages: [format(messages)].flatten}.merge!(params))
      set_body_stream(req, StringIO.new(body))
      res = request(@http, req)
      Response::Completion.new(res).extend(response_parser)
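
With `format_tools` wired into `complete`, a per-request tool list becomes possible. A sketch, assuming an Anthropic key and the hypothetical weather function from the LLM::Function example above:

```ruby
llm = LLM.anthropic(ENV["ANTHROPIC_API_KEY"])
res = llm.complete(
  "What is the weather in Berlin?", :user,
  tools: [weather] # each tool is serialised via LLM::Function#format
)
reply = res.choices[0]
reply.functions.each { |fn| p fn.call } if reply.tool_call?
```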
data/lib/llm/providers/gemini/audio.rb
CHANGED
@@ -34,7 +34,7 @@ class LLM::Gemini
     # res = llm.audio.create_transcription(file: LLM::File("/rocket.mp3"))
     # res.text # => "A dog on a rocket to the moon"
     # @see https://ai.google.dev/gemini-api/docs/audio Gemini docs
-    # @param [LLM::File, LLM::Response::File] file The input audio
+    # @param [String, LLM::File, LLM::Response::File] file The input audio
     # @param [String] model The model to use
     # @param [Hash] params Other parameters (see Gemini docs)
     # @raise (see LLM::Provider#request)
@@ -43,7 +43,7 @@ class LLM::Gemini
       res = @provider.complete [
         "Your task is to transcribe the contents of an audio file",
         "Your response should include the transcription, and nothing else",
-        file
+        LLM.File(file)
       ], :user, model:, **params
       LLM::Response::AudioTranscription
         .new(res)
@@ -58,7 +58,7 @@ class LLM::Gemini
     # res = llm.audio.create_translation(file: LLM::File("/bismillah.mp3"))
     # res.text # => "In the name of Allah, the Beneficent, the Merciful."
     # @see https://ai.google.dev/gemini-api/docs/audio Gemini docs
-    # @param [LLM::File, LLM::Response::File] file The input audio
+    # @param [String, LLM::File, LLM::Response::File] file The input audio
     # @param [String] model The model to use
     # @param [Hash] params Other parameters (see Gemini docs)
     # @raise (see LLM::Provider#request)
@@ -67,7 +67,7 @@ class LLM::Gemini
       res = @provider.complete [
         "Your task is to translate the contents of an audio file into English",
         "Your response should include the translation, and nothing else",
-        file
+        LLM.File(file)
       ], :user, model:, **params
       LLM::Response::AudioTranslation
         .new(res)
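
Because inputs are now coerced through `LLM.File` (presumably defined in data/lib/llm.rb, whose 28 added lines are not shown here), a plain path string is enough:

```ruby
llm = LLM.gemini(ENV["KEY"])
res = llm.audio.create_transcription(file: "/rocket.mp3")
res.text # => "A dog on a rocket to the moon"
```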
data/lib/llm/providers/gemini/files.rb
CHANGED
@@ -19,7 +19,7 @@ class LLM::Gemini
   #
   # llm = LLM.gemini(ENV["KEY"])
   # bot = LLM::Chat.new(llm).lazy
-  # file = llm.files.create file: …
+  # file = llm.files.create file: "/audio/haiku.mp3"
   # bot.chat(file)
   # bot.chat("Describe the audio file I sent to you")
   # bot.chat("The audio file is the first message I sent to you.")
@@ -30,7 +30,7 @@ class LLM::Gemini
   #
   # llm = LLM.gemini(ENV["KEY"])
   # bot = LLM::Chat.new(llm).lazy
-  # file = llm.files.create file: …
+  # file = llm.files.create file: "/audio/haiku.mp3"
   # bot.chat(["Describe the audio file I sent to you", file])
   # bot.messages.select(&:assistant?).each { print "[#{_1.role}]", _1.content, "\n" }
   class Files
@@ -71,13 +71,14 @@ class LLM::Gemini
     # Create a file
     # @example
     # llm = LLM.gemini(ENV["KEY"])
-    # res = llm.files.create file: …
+    # res = llm.files.create file: "/audio/haiku.mp3"
     # @see https://ai.google.dev/gemini-api/docs/files Gemini docs
-    # @param [File] file The file
+    # @param [String, LLM::File] file The file
     # @param [Hash] params Other parameters (see Gemini docs)
     # @raise (see LLM::Provider#request)
     # @return [LLM::Response::File]
     def create(file:, **params)
+      file = LLM.File(file)
      req = Net::HTTP::Post.new(request_upload_url(file:), {})
      req["content-length"] = file.bytesize
      req["X-Goog-Upload-Offset"] = 0
data/lib/llm/providers/gemini/format/completion_format.rb
ADDED
@@ -0,0 +1,54 @@
+# frozen_string_literal: true
+
+module LLM::Gemini::Format
+  ##
+  # @private
+  class CompletionFormat
+    ##
+    # @param [LLM::Message, Hash] message
+    # The message to format
+    def initialize(message)
+      @message = message
+    end
+
+    ##
+    # Formats the message for the Gemini chat completions API
+    # @return [Hash]
+    def format
+      catch(:abort) do
+        if Hash === message
+          {role: message[:role], parts: format_content(message[:content])}
+        elsif message.tool_call?
+          {role: message.role, parts: message.extra[:original_tool_calls].map { {"functionCall" => _1} }}
+        else
+          {role: message.role, parts: format_content(message.content)}
+        end
+      end
+    end
+
+    def format_content(content)
+      case content
+      when Array
+        content.empty? ? throw(:abort, nil) : content.flat_map { format_content(_1) }
+      when LLM::Response::File
+        file = content
+        [{file_data: {mime_type: file.mime_type, file_uri: file.uri}}]
+      when LLM::File
+        file = content
+        [{inline_data: {mime_type: file.mime_type, data: file.to_b64}}]
+      when String
+        [{text: content}]
+      when LLM::Message
+        format_content(content.content)
+      when LLM::Function::Return
+        [{text: content.value}]
+      else
+        raise LLM::Error::PromptError, "The given object (an instance of #{content.class}) " \
+                                       "is not supported by the Gemini API"
+      end
+    end
+
+    def message = @message
+    def content = message.content
+  end
+end
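
The Gemini formatter mirrors its Anthropic counterpart but emits `parts` instead of content blocks (illustrative, derived from `format_content` above):

```ruby
message = LLM::Message.new(:user, "Hello")
LLM::Gemini::Format::CompletionFormat.new(message).format
# => {role: :user, parts: [{text: "Hello"}]}
```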