ruby_llm 0.1.0.pre3 → 0.1.0.pre5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.github/workflows/gem-push.yml +1 -1
- data/.github/workflows/test.yml +5 -2
- data/.overcommit.yml +1 -1
- data/README.md +56 -181
- data/bin/console +6 -0
- data/lib/ruby_llm/chat.rb +95 -0
- data/lib/ruby_llm/chunk.rb +6 -0
- data/lib/ruby_llm/configuration.rb +2 -4
- data/lib/ruby_llm/message.rb +26 -20
- data/lib/ruby_llm/model_capabilities/anthropic.rb +43 -48
- data/lib/ruby_llm/model_capabilities/openai.rb +82 -89
- data/lib/ruby_llm/model_info.rb +26 -17
- data/lib/ruby_llm/models.json +686 -0
- data/lib/ruby_llm/models.rb +52 -0
- data/lib/ruby_llm/provider.rb +99 -0
- data/lib/ruby_llm/providers/anthropic.rb +97 -193
- data/lib/ruby_llm/providers/openai.rb +125 -142
- data/lib/ruby_llm/tool.rb +71 -50
- data/lib/ruby_llm/version.rb +1 -1
- data/lib/ruby_llm.rb +35 -37
- data/lib/tasks/models.rake +25 -0
- data/ruby_llm.gemspec +1 -0
- metadata +32 -8
- data/lib/ruby_llm/active_record/acts_as.rb +0 -115
- data/lib/ruby_llm/client.rb +0 -67
- data/lib/ruby_llm/conversation.rb +0 -19
- data/lib/ruby_llm/model_capabilities/base.rb +0 -35
- data/lib/ruby_llm/providers/base.rb +0 -60
--- /dev/null
+++ b/data/lib/ruby_llm/models.rb
@@ -0,0 +1,52 @@
+# frozen_string_literal: true
+
+module RubyLLM
+  module Models
+    module_function
+
+    def provider_for(model)
+      Provider.for(model)
+    end
+
+    def all
+      @all ||= begin
+        data = JSON.parse(File.read(File.expand_path('models.json', __dir__)))
+        data['models'].map { |model| ModelInfo.new(model.transform_keys(&:to_sym)) }
+      end
+    rescue Errno::ENOENT
+      [] # Return empty array if file doesn't exist yet
+    end
+
+    def find(model_id)
+      all.find { |m| m.id == model_id } or raise Error, "Unknown model: #{model_id}"
+    end
+
+    def chat_models
+      all.select { |m| m.type == 'chat' }
+    end
+
+    def embedding_models
+      all.select { |m| m.type == 'embedding' }
+    end
+
+    def audio_models
+      all.select { |m| m.type == 'audio' }
+    end
+
+    def image_models
+      all.select { |m| m.type == 'image' }
+    end
+
+    def by_family(family)
+      all.select { |m| m.family == family }
+    end
+
+    def default_model
+      'gpt-4o-mini'
+    end
+
+    def refresh!
+      @all = nil
+    end
+  end
+end
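The new `Models` module replaces scattered per-provider lookups with a single registry hydrated from the bundled `models.json` (+686 lines in this release). A short usage sketch follows; the model ID is only an example, and what `all` returns depends on the `models.json` the gem ships with:

```ruby
require 'ruby_llm'

# Enumerate chat-capable models from the bundled registry.
RubyLLM::Models.chat_models.map(&:id)

# Exact lookup; raises RubyLLM::Error when the ID is not in models.json.
model = RubyLLM::Models.find('gpt-4o-mini')
model.max_tokens # per-model output limit, consumed by build_payload below

# Drop the memoized list so models.json is re-read on next access,
# e.g. after regenerating it with the new models rake task.
RubyLLM::Models.refresh!
```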
--- /dev/null
+++ b/data/lib/ruby_llm/provider.rb
@@ -0,0 +1,99 @@
+# frozen_string_literal: true
+
+module RubyLLM
+  module Provider
+    def self.included(base)
+      base.include(InstanceMethods)
+    end
+
+    module InstanceMethods
+      def complete(messages, tools: [], model: nil, &block)
+        # TODO: refactor
+        payload = build_payload(messages, tools, model: model, stream: block_given?)
+
+        content = String.new
+        model_id = nil
+        input_tokens = 0
+        output_tokens = 0
+        response = connection.post(completion_url, payload) do |req|
+          req.headers.merge! headers
+          if block_given?
+            req.options.on_data = handle_stream do |chunk|
+              model_id ||= chunk.model_id
+              content << (chunk.content || '')
+              input_tokens += chunk.input_tokens if chunk.input_tokens
+              output_tokens += chunk.output_tokens if chunk.output_tokens
+              block.call(chunk)
+            end
+          end
+        end
+
+        if block_given?
+          Message.new(
+            role: :assistant,
+            content: content,
+            model_id: model_id,
+            input_tokens: input_tokens.positive? ? input_tokens : nil,
+            output_tokens: output_tokens.positive? ? output_tokens : nil
+          )
+        else
+          parse_completion_response(response)
+        end
+      end
+
+      def list_models
+        response = connection.get(models_url) do |req|
+          req.headers.merge!(headers)
+        end
+
+        parse_list_models_response(response)
+      end
+
+      private
+
+      def connection
+        @connection ||= Faraday.new(api_base) do |f|
+          f.options.timeout = RubyLLM.config.request_timeout
+          f.request :json
+          f.response :json
+          f.adapter Faraday.default_adapter
+          f.use Faraday::Response::RaiseError
+          f.response :logger, RubyLLM.logger, { headers: false, bodies: true, errors: true, log_level: :debug }
+        end
+      end
+
+      def to_json_stream(&block)
+        parser = EventStreamParser::Parser.new
+        proc do |chunk, _bytes, _|
+          parser.feed(chunk) do |_type, data|
+            unless data == '[DONE]'
+              parsed_data = JSON.parse(data)
+              RubyLLM.logger.debug "chunk: #{parsed_data}"
+              block.call(parsed_data)
+            end
+          end
+        end
+      end
+    end
+
+    class << self
+      def register(name, provider_class)
+        providers[name.to_sym] = provider_class
+      end
+
+      def for(model)
+        model_info = Models.find(model)
+        provider_class = providers[model_info.provider.to_sym] or
+          raise Error, "No provider registered for #{model_info.provider}"
+
+        provider_class.new
+      end
+
+      private
+
+      def providers
+        @providers ||= {}
+      end
+    end
+  end
+end
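`Provider` is the core of the refactor: the deleted `Providers::Base` class (-60 lines) becomes a mixin that owns the Faraday connection, the streaming accumulator, and SSE parsing via the new `event_stream_parser` dependency, while each concrete provider supplies only endpoints, headers, payload construction, and response parsing. A minimal sketch of that contract using an entirely hypothetical provider (no `Fake` class or endpoint exists in the gem):

```ruby
module RubyLLM
  module Providers
    # Hypothetical provider showing the methods the Provider mixin expects.
    class Fake
      include Provider

      private

      def api_base
        'https://api.fake.example'
      end

      def headers
        { 'Authorization' => "Bearer #{ENV.fetch('FAKE_API_KEY')}" }
      end

      def completion_url
        '/v1/chat'
      end

      def models_url
        '/v1/models'
      end

      # Called by Provider#complete with stream: true when a block is given.
      def build_payload(messages, tools, model:, stream: false)
        {
          model: model,
          stream: stream,
          messages: messages.map { |m| { role: m.role, content: m.content } }
        }
      end

      def parse_completion_response(response)
        Message.new(role: :assistant, content: response.body['text'])
      end

      # Wraps the shared SSE parser; yields one Chunk per streamed event.
      def handle_stream(&block)
        to_json_stream do |data|
          block.call(Chunk.new(role: :assistant, content: data['text']))
        end
      end
    end
  end
end

RubyLLM::Provider.register(:fake, RubyLLM::Providers::Fake)
```

Note that `Provider.for` resolves through `Models.find`, so a registered provider is only reachable for model IDs whose `models.json` entry names it in the `provider` field. With that wiring in place, `provider.complete(messages, model: 'fake-1') { |chunk| print chunk.content }` streams chunks and returns the assembled assistant `Message`; without a block it returns whatever `parse_completion_response` builds.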
--- a/data/lib/ruby_llm/providers/anthropic.rb
+++ b/data/lib/ruby_llm/providers/anthropic.rb
@@ -1,51 +1,82 @@
 # frozen_string_literal: true
 
-require 'time'
-
 module RubyLLM
   module Providers
-    class Anthropic
-
-
-
-
-
-
-
+    class Anthropic
+      include Provider
+
+      private
+
+      def api_base
+        'https://api.anthropic.com'
+      end
+
+      def headers
+        {
+          'x-api-key' => RubyLLM.config.anthropic_api_key,
+          'anthropic-version' => '2023-06-01'
         }
+      end
 
-
+      def completion_url
+        '/v1/messages'
+      end
 
-
-
+      def models_url
+        '/v1/models'
+      end
 
-
-
-
-
+      def build_payload(messages, tools, model:, temperature: 0.7, stream: false)
+        {
+          model: model,
+          messages: format_messages(messages),
+          temperature: temperature,
+          stream: stream,
+          max_tokens: RubyLLM.models.find(model).max_tokens
+        }.tap do |payload|
+          payload[:tools] = tools.map { |t| function_for(t) } if tools.any?
         end
       end
 
-      def
-
-
+      def parse_completion_response(response)
+        data = response.body
+        content_blocks = data['content'] || []
+
+        text_content = content_blocks.find { |c| c['type'] == 'text' }&.fetch('text', '')
+        tool_use = content_blocks.find { |c| c['type'] == 'tool_use' }
+
+        if tool_use
+          Message.new(
+            role: :assistant,
+            content: text_content,
+            tool_calls: [
+              {
+                name: tool_use['name'],
+                arguments: JSON.generate(tool_use['input'] || {})
+              }
+            ]
+          )
+        else
+          Message.new(
+            role: :assistant,
+            content: text_content,
+            input_tokens: data['usage']['input_tokens'],
+            output_tokens: data['usage']['output_tokens'],
+            model_id: data['model']
+          )
         end
+      end
 
-
-
-        capabilities = RubyLLM::ModelCapabilities::Anthropic.new
-        models_data = response.body['data'] || []
+      def parse_models_response(response)
+        capabilities = ModelCapabilities::Anthropic.new
 
-
+        (response.body['data'] || []).map do |model|
           ModelInfo.new(
             id: model['id'],
             created_at: Time.parse(model['created_at']),
             display_name: model['display_name'],
             provider: 'anthropic',
-            metadata: {
-              type: model['type']
-            },
+            metadata: { type: model['type'] },
             context_window: capabilities.determine_context_window(model['id']),
             max_tokens: capabilities.determine_max_tokens(model['id']),
             supports_vision: capabilities.supports_vision?(model['id']),
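Two changes stand out in this first hunk: `max_tokens` is now resolved per model from the registry (`RubyLLM.models.find(model).max_tokens`) instead of being hard-coded, and `parse_completion_response` surfaces structured `tool_calls` on the `Message` rather than executing tools inside the provider. For a plain two-message exchange, `build_payload` produces roughly the following hash before Faraday JSON-encodes it (the model ID and the 8192 limit are illustrative, not values from `models.json`):

```ruby
{
  model: 'claude-3-5-haiku-latest',   # whatever the caller selected
  messages: [                         # via format_messages, second hunk below
    { role: 'user', content: 'Ping?' },
    { role: 'assistant', content: 'Pong.' }
  ],
  temperature: 0.7,                   # keyword default in build_payload
  stream: false,                      # true when complete receives a block
  max_tokens: 8192                    # from the model's registry entry
}
```

The second hunk of `anthropic.rb` continues below, replacing the old inline tool execution and hand-rolled streaming loop: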
@@ -55,199 +86,72 @@ module RubyLLM
             output_price_per_million: capabilities.get_output_price(model['id'])
           )
         end
-      rescue Faraday::Error => e
-        handle_error(e)
       end
 
-
+      def handle_stream(&block)
+        to_json_stream do |data|
+          block.call(
+            Chunk.new(
+              role: :assistant,
+              model_id: data.dig('message', 'model'),
+              content: data.dig('delta', 'text'),
+              input_tokens: data.dig('message', 'usage', 'input_tokens'),
+              output_tokens: data.dig('message', 'usage', 'output_tokens') || data.dig('usage', 'output_tokens')
+            )
+          )
+        end
+      end
 
-      def
+      def function_for(tool)
         {
           name: tool.name,
           description: tool.description,
           input_schema: {
             type: 'object',
-            properties: tool.parameters,
-            required: tool.parameters
+            properties: clean_parameters(tool.parameters),
+            required: required_parameters(tool.parameters)
           }
         }
       end
 
       def format_messages(messages)
         messages.map do |msg|
-
-
-          message[:content] = if msg.tool_results
-            [
-              {
-                type: 'tool_result',
-                tool_use_id: msg.tool_results[:tool_use_id],
-                content: msg.tool_results[:content],
-                is_error: msg.tool_results[:is_error]
-              }.compact
-            ]
-          else
-            msg.content
-          end
-
-          message
-        end
-      end
-
-      def create_chat_completion(payload, tools = nil)
-        response = @connection.post('/v1/messages') do |req|
-          req.headers['x-api-key'] = RubyLLM.configuration.anthropic_api_key
-          req.headers['anthropic-version'] = '2023-06-01'
-          req.headers['Content-Type'] = 'application/json'
-          req.body = payload
-        end
-
-        puts 'Response from Anthropic:' if ENV['RUBY_LLM_DEBUG']
-        puts JSON.pretty_generate(response.body) if ENV['RUBY_LLM_DEBUG']
-
-        handle_response(response, tools, payload)
-      rescue Faraday::Error => e
-        handle_error(e)
-      end
-
-      def stream_chat_completion(payload, tools = nil)
-        response = @connection.post('/v1/messages') do |req|
-          req.headers['x-api-key'] = RubyLLM.configuration.anthropic_api_key
-          req.headers['anthropic-version'] = '2023-06-01'
-          req.body = payload
-        end
-
-        response.body.each_line do |line|
-          next if line.strip.empty?
-          next if line == 'data: [DONE]'
-
-          begin
-            data = JSON.parse(line.sub(/^data: /, ''))
-
-            if data['type'] == 'content_block_delta'
-              content = data['delta']['text']
-              yield Message.new(role: :assistant, content: content) if content
-            elsif data['type'] == 'tool_call'
-              handle_tool_calls(data['tool_calls'], tools) do |result|
-                yield Message.new(role: :assistant, content: result)
-              end
-            end
-          rescue JSON::ParserError
-            next
-          end
-        end
-      rescue Faraday::Error => e
-        handle_error(e)
-      end
-
-      def handle_response(response, tools, payload)
-        data = response.body
-        return Message.new(role: :assistant, content: '') if data['type'] == 'error'
-
-        # Extract text content and tool use from response
-        content_parts = data['content'] || []
-        text_content = content_parts.find { |c| c['type'] == 'text' }&.fetch('text', '')
-        tool_use = content_parts.find { |c| c['type'] == 'tool_use' }
-
-        if tool_use && tools
-          tool = tools.find { |t| t.name == tool_use['name'] }
-          result = if tool
-            begin
-              tool_result = tool.call(tool_use['input'] || {})
-              {
-                tool_use_id: tool_use['id'],
-                content: tool_result.to_s
-              }
-            rescue StandardError => e
-              {
-                tool_use_id: tool_use['id'],
-                content: "Error executing tool #{tool.name}: #{e.message}",
-                is_error: true
-              }
-            end
-          end
-
-          # Create a new message with the tool result
-          new_messages = payload[:messages] + [
-            { role: 'assistant', content: data['content'] },
+          if msg.tool_results
             {
-              role:
+              role: convert_role(msg.role),
               content: [
                 {
                   type: 'tool_result',
-                  tool_use_id:
-                  content:
-                  is_error:
+                  tool_use_id: msg.tool_results[:tool_use_id],
+                  content: msg.tool_results[:content],
+                  is_error: msg.tool_results[:is_error]
                 }.compact
               ]
             }
-
-
-          return create_chat_completion(payload.merge(messages: new_messages), tools)
-        end
-
-        # Extract token usage from response
-        token_usage = if data['usage']
-          {
-            input_tokens: data['usage']['input_tokens'],
-            output_tokens: data['usage']['output_tokens'],
-            total_tokens: data['usage']['input_tokens'] + data['usage']['output_tokens']
-          }
-        end
-
-        Message.new(
-          role: :assistant,
-          content: text_content,
-          token_usage: token_usage,
-          model_id: data['model']
-        )
-      end
-
-      def handle_tool_calls(tool_calls, tools)
-        return [] unless tool_calls && tools
-
-        tool_calls.map do |tool_call|
-          tool = tools.find { |t| t.name == tool_call['name'] }
-          next unless tool
-
-          begin
-            args = JSON.parse(tool_call['arguments'])
-            result = tool.call(args)
-            puts "Tool result: #{result}" if ENV['RUBY_LLM_DEBUG']
-            {
-              tool_use_id: tool_call['id'],
-              content: result.to_s
-            }
-          rescue JSON::ParserError, ArgumentError => e
-            puts "Error executing tool: #{e.message}" if ENV['RUBY_LLM_DEBUG']
+          else
             {
-
-              content:
-              is_error: true
+              role: convert_role(msg.role),
+              content: msg.content
             }
           end
-        end
+        end
       end
 
-      def
-
-
-
-        error_data = JSON.parse(response_body)
-        message = error_data.dig('error', 'message')
-        raise RubyLLM::Error, "API error: #{message}" if message
-      rescue JSON::ParserError
-        raise RubyLLM::Error, "API error: #{error.response[:status]}"
-      end
-      elsif response_body.dig('error', 'type') == 'invalid_request_error'
-        raise RubyLLM::Error, "API error: #{response_body['error']['message']}"
-      else
-        raise RubyLLM::Error, "API error: #{error.response[:status]}"
+      def convert_role(role)
+        case role
+        when :user then 'user'
+        else 'assistant'
+        end
+      end
+
+      def clean_parameters(parameters)
+        parameters.transform_values do |props|
+          props.except(:required)
+        end
+      end
+
+      def required_parameters(parameters)
+        parameters.select { |_, props| props[:required] }.keys
       end
     end
   end
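The new `clean_parameters`/`required_parameters` pair also fixes a pre3 bug visible above: `function_for` used to send `required: tool.parameters`, the entire hash, where Anthropic expects an array of property names. A worked example of the split (the weather-style parameter hash is invented; `Hash#except` requires Ruby >= 3.0 or ActiveSupport):

```ruby
parameters = {
  location: { type: 'string', description: 'City name', required: true },
  unit:     { type: 'string', description: 'celsius or fahrenheit' }
}

# clean_parameters: strip the gem-internal :required flag from each property.
properties = parameters.transform_values { |props| props.except(:required) }
# => { location: { type: 'string', description: 'City name' },
#      unit:     { type: 'string', description: 'celsius or fahrenheit' } }

# required_parameters: collect just the names that were flagged.
required = parameters.select { |_, props| props[:required] }.keys
# => [:location]

# function_for embeds both into the tool definition sent to Anthropic:
# { name: ..., description: ...,
#   input_schema: { type: 'object', properties: properties, required: required } }
```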