RubyGems - ruby_llm - Versions diffs - 1.0.1 → 1.1.0rc1 - Mend

ruby_llm 1.0.1 → 1.1.0rc1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

checksums.yaml +4 -4
data/README.md +28 -12
data/lib/ruby_llm/active_record/acts_as.rb +46 -7
data/lib/ruby_llm/aliases.json +65 -0
data/lib/ruby_llm/aliases.rb +56 -0
data/lib/ruby_llm/chat.rb +10 -9
data/lib/ruby_llm/configuration.rb +4 -0
data/lib/ruby_llm/error.rb +15 -4
data/lib/ruby_llm/models.json +1163 -303
data/lib/ruby_llm/models.rb +40 -11
data/lib/ruby_llm/provider.rb +32 -39
data/lib/ruby_llm/providers/anthropic/capabilities.rb +8 -9
data/lib/ruby_llm/providers/anthropic/chat.rb +31 -4
data/lib/ruby_llm/providers/anthropic/streaming.rb +12 -6
data/lib/ruby_llm/providers/anthropic.rb +4 -0
data/lib/ruby_llm/providers/bedrock/capabilities.rb +168 -0
data/lib/ruby_llm/providers/bedrock/chat.rb +108 -0
data/lib/ruby_llm/providers/bedrock/models.rb +84 -0
data/lib/ruby_llm/providers/bedrock/signing.rb +831 -0
data/lib/ruby_llm/providers/bedrock/streaming/base.rb +46 -0
data/lib/ruby_llm/providers/bedrock/streaming/content_extraction.rb +63 -0
data/lib/ruby_llm/providers/bedrock/streaming/message_processing.rb +79 -0
data/lib/ruby_llm/providers/bedrock/streaming/payload_processing.rb +90 -0
data/lib/ruby_llm/providers/bedrock/streaming/prelude_handling.rb +91 -0
data/lib/ruby_llm/providers/bedrock/streaming.rb +36 -0
data/lib/ruby_llm/providers/bedrock.rb +83 -0
data/lib/ruby_llm/providers/deepseek/chat.rb +17 -0
data/lib/ruby_llm/providers/deepseek.rb +5 -0
data/lib/ruby_llm/providers/gemini/capabilities.rb +50 -34
data/lib/ruby_llm/providers/gemini/chat.rb +8 -15
data/lib/ruby_llm/providers/gemini/images.rb +5 -10
data/lib/ruby_llm/providers/gemini/streaming.rb +35 -76
data/lib/ruby_llm/providers/gemini/tools.rb +12 -12
data/lib/ruby_llm/providers/gemini.rb +4 -0
data/lib/ruby_llm/providers/openai/capabilities.rb +146 -206
data/lib/ruby_llm/providers/openai/streaming.rb +9 -13
data/lib/ruby_llm/providers/openai.rb +4 -0
data/lib/ruby_llm/streaming.rb +96 -0
data/lib/ruby_llm/version.rb +1 -1
data/lib/ruby_llm.rb +6 -3
data/lib/tasks/browser_helper.rb +97 -0
data/lib/tasks/capability_generator.rb +123 -0
data/lib/tasks/capability_scraper.rb +224 -0
data/lib/tasks/cli_helper.rb +22 -0
data/lib/tasks/code_validator.rb +29 -0
data/lib/tasks/model_updater.rb +66 -0
data/lib/tasks/models.rake +28 -193
data/lib/tasks/vcr.rake +13 -30
metadata +27 -19
data/.github/workflows/cicd.yml +0 -158
data/.github/workflows/docs.yml +0 -53
data/.gitignore +0 -59
data/.overcommit.yml +0 -26
data/.rspec +0 -3
data/.rubocop.yml +0 -10
data/.yardopts +0 -12
data/CONTRIBUTING.md +0 -207
data/Gemfile +0 -33
data/Rakefile +0 -9
data/bin/console +0 -17
data/bin/setup +0 -6
data/ruby_llm.gemspec +0 -44

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: fd4d6fd8e0894176fff57bd2a3132b965afbb912108d45d94cba3b4b3106ff7c
-  data.tar.gz: 071a8ff4dcffcba66d042d3e822c2297b8a2c4485c4ee1fb48d0a03ec49c0547
+  metadata.gz: 7f1ca42c438f99a40f6ada6ab87e23377403d9d6c8db6049d54960308b6dd42f
+  data.tar.gz: 0467734c40a0a64505b8f4de2eea4b929e2b0c615fedb3fe88d75f8cf20040de
 SHA512:
-  metadata.gz: 5d995c552810743910286207c47d2342de7e2ee14b833b627267d4fcec3c02931650b499de048319de293914fd0c19689124f818e994e74de04e8c819b934e91
-  data.tar.gz: 85598c0a2b633092eb5d5fa5b13b59f03b2c3c5effd826f483d64b87f58b8caaf3637b28308d027eaeed3a03d708a0267b420556ca54206de9a9ac69ab97455c
+  metadata.gz: ed886fb15081ce27309c0e583223e62adf171907f0f047344763e9eae5ede4dbb96657bb1b69dde9e68bc1ed56acedb93717273067236e40104dddcc09886f33
+  data.tar.gz: 7f2aa9c50cfd1a525273256ff014712944c976229f6b90fe338decaf2525bcb82f19dec187d14795ce0891a7fceadb5c048905c8afa8066b0ddbe37d54c48edd

data/README.md CHANGED Viewed

@@ -2,17 +2,20 @@
 A delightful Ruby way to work with AI. No configuration madness, no complex callbacks, no handler hell – just beautiful, expressive Ruby code.
-<div style="display: flex; align-items: center; flex-wrap: wrap; gap: 4px;">
+<div style="display: flex; align-items: center; flex-wrap: wrap; margin-bottom: 1em">
   <img src="https://upload.wikimedia.org/wikipedia/commons/4/4d/OpenAI_Logo.svg" alt="OpenAI" height="40" width="120">
-  &nbsp;&nbsp;&nbsp;&nbsp;
+  &nbsp;&nbsp;
   <img src="https://upload.wikimedia.org/wikipedia/commons/7/78/Anthropic_logo.svg" alt="Anthropic" height="40" width="120">
-  &nbsp;&nbsp;&nbsp;&nbsp;
+  &nbsp;&nbsp;
   <img src="https://upload.wikimedia.org/wikipedia/commons/8/8a/Google_Gemini_logo.svg" alt="Google" height="40" width="120">
-  &nbsp;&nbsp;&nbsp;&nbsp;
+  &nbsp;&nbsp;
+  <img src="https://registry.npmmirror.com/@lobehub/icons-static-svg/latest/files/icons/bedrock-color.svg" alt="Bedrock" height="40">
+  <img src="https://registry.npmmirror.com/@lobehub/icons-static-svg/latest/files/icons/bedrock-text.svg" alt="Bedrock" height="40" width="120">
+  &nbsp;&nbsp;
   <img src="https://upload.wikimedia.org/wikipedia/commons/e/ec/DeepSeek_logo.svg" alt="DeepSeek" height="40" width="120">
 </div>
-<a href="https://badge.fury.io/rb/ruby_llm"><img src="https://badge.fury.io/rb/ruby_llm.svg?dummy=unused" alt="Gem Version" /></a>
+<a href="https://badge.fury.io/rb/ruby_llm"><img src="https://badge.fury.io/rb/ruby_llm.svg" alt="Gem Version" /></a>
 <a href="https://github.com/testdouble/standard"><img src="https://img.shields.io/badge/code_style-standard-brightgreen.svg" alt="Ruby Style Guide" /></a>
 <a href="https://rubygems.org/gems/ruby_llm"><img alt="Gem Downloads" src="https://img.shields.io/gem/dt/ruby_llm"></a>
 <a href="https://codecov.io/gh/crmne/ruby_llm"><img src="https://codecov.io/gh/crmne/ruby_llm/branch/main/graph/badge.svg" alt="codecov" /></a>
@@ -27,7 +30,7 @@ RubyLLM fixes all that. One beautiful API for everything. One consistent format.
 ## Features
-- 💬 **Chat** with OpenAI, Anthropic, Gemini, and DeepSeek models
+- 💬 **Chat** with OpenAI, Anthropic, Gemini, AWS Bedrock Anthropic, and DeepSeek models
 - 👁️ **Vision and Audio** understanding
 - 📄 **PDF Analysis** for analyzing documents
 - 🖼️ **Image generation** with DALL-E and other providers
@@ -99,10 +102,16 @@ Configure with your API keys:
 ```ruby
 RubyLLM.configure do |config|
-  config.openai_api_key = ENV['OPENAI_API_KEY']
-  config.anthropic_api_key = ENV['ANTHROPIC_API_KEY']
-  config.gemini_api_key = ENV['GEMINI_API_KEY']
-  config.deepseek_api_key = ENV['DEEPSEEK_API_KEY']
+  config.openai_api_key = ENV.fetch('OPENAI_API_KEY', nil)
+  config.anthropic_api_key = ENV.fetch('ANTHROPIC_API_KEY', nil)
+  config.gemini_api_key = ENV.fetch('GEMINI_API_KEY', nil)
+  config.deepseek_api_key = ENV.fetch('DEEPSEEK_API_KEY', nil)
+  # Bedrock
+  config.bedrock_api_key = ENV.fetch('AWS_ACCESS_KEY_ID', nil)
+  config.bedrock_secret_key = ENV.fetch('AWS_SECRET_ACCESS_KEY', nil)
+  config.bedrock_region = ENV.fetch('AWS_REGION', nil)
+  config.bedrock_session_token = ENV.fetch('AWS_SESSION_TOKEN', nil)
 end
 ```
@@ -126,6 +135,9 @@ chat.ask "Tell me a story about a Ruby programmer" do |chunk|
   print chunk.content
 end
+# Set personality or behavior with instructions (aka system prompts) - available from 1.1.0
+chat.with_instructions "You are a friendly Ruby expert who loves to help beginners"
 # Understand content in multiple forms
 chat.ask "Compare these diagrams", with: { image: ["diagram1.png", "diagram2.png"] }
 chat.ask "Summarize this document", with: { pdf: "contract.pdf" }
@@ -156,8 +168,12 @@ class ToolCall < ApplicationRecord
   acts_as_tool_call
 end
-# In your controller
-chat = Chat.create!(model_id: "gpt-4o-mini")
+# In a background job
+chat = Chat.create! model_id: "gpt-4o-mini"
+# Set personality or behavior with instructions (aka system prompts) - they're persisted too! - available from 1.1.0
+chat.with_instructions "You are a friendly Ruby expert who loves to help beginners"
 chat.ask("What's your favorite Ruby gem?") do |chunk|
   Turbo::StreamsChannel.broadcast_append_to(
     chat,

data/lib/ruby_llm/active_record/acts_as.rb CHANGED Viewed

@@ -9,7 +9,7 @@ module RubyLLM
       extend ActiveSupport::Concern
       class_methods do # rubocop:disable Metrics/BlockLength
-        def acts_as_chat(message_class: 'Message', tool_call_class: 'ToolCall') # rubocop:disable Metrics/MethodLength
+        def acts_as_chat(message_class: 'Message', tool_call_class: 'ToolCall')
           include ChatMethods
           @message_class = message_class.to_s
@@ -21,12 +21,6 @@ module RubyLLM
                    dependent: :destroy
           delegate :complete,
-                   :with_tool,
-                   :with_tools,
-                   :with_model,
-                   :with_temperature,
-                   :on_new_message,
-                   :on_end_message,
                    :add_message,
                    to: :to_llm
         end
@@ -85,6 +79,51 @@ module RubyLLM
              .on_end_message { |msg| persist_message_completion(msg) }
       end
+      def with_instructions(instructions, replace: false)
+        transaction do
+          # If replace is true, remove existing system messages
+          messages.where(role: :system).destroy_all if replace
+          # Create the new system message
+          messages.create!(
+            role: :system,
+            content: instructions
+          )
+        end
+        to_llm.with_instructions(instructions)
+        self
+      end
+      def with_tool(tool)
+        to_llm.with_tool(tool)
+        self
+      end
+      def with_tools(*tools)
+        to_llm.with_tools(*tools)
+        self
+      end
+      def with_model(model_id, provider: nil)
+        to_llm.with_model(model_id, provider: provider)
+        self
+      end
+      def with_temperature(temperature)
+        to_llm.with_temperature(temperature)
+        self
+      end
+      def on_new_message(&)
+        to_llm.on_new_message(&)
+        self
+      end
+      def on_end_message(&)
+        to_llm.on_end_message(&)
+        self
+      end
       def ask(message, &)
         message = { role: :user, content: message }
         messages.create!(**message)

data/lib/ruby_llm/aliases.json ADDED Viewed

@@ -0,0 +1,65 @@
+{
+  "claude-3-5-sonnet": {
+    "anthropic": "claude-3-5-sonnet-20241022",
+    "bedrock": "anthropic.claude-3-5-sonnet-20241022-v2:0"
+  },
+  "claude-3-5-haiku": {
+    "anthropic": "claude-3-5-haiku-20241022",
+    "bedrock": "anthropic.claude-3-5-haiku-20241022-v1:0"
+  },
+  "claude-3-7-sonnet": {
+    "anthropic": "claude-3-7-sonnet-20250219",
+    "bedrock": "us.anthropic.claude-3-7-sonnet-20250219-v1:0"
+  },
+  "claude-3-opus": {
+    "anthropic": "claude-3-opus-20240229",
+    "bedrock": "anthropic.claude-3-opus-20240229-v1:0"
+  },
+  "claude-3-sonnet": {
+    "anthropic": "claude-3-sonnet-20240229",
+    "bedrock": "anthropic.claude-3-sonnet-20240229-v1:0"
+  },
+  "claude-3-haiku": {
+    "anthropic": "claude-3-haiku-20240307",
+    "bedrock": "anthropic.claude-3-haiku-20240307-v1:0"
+  },
+  "claude-3": {
+    "anthropic": "claude-3-sonnet-20240229",
+    "bedrock": "anthropic.claude-3-sonnet-20240229-v1:0"
+  },
+  "claude-2": {
+    "anthropic": "claude-2.0",
+    "bedrock": "anthropic.claude-2.0"
+  },
+  "claude-2-1": {
+    "anthropic": "claude-2.1",
+    "bedrock": "anthropic.claude-2.1"
+  },
+  "gpt-4o": {
+    "openai": "gpt-4o-2024-11-20"
+  },
+  "gpt-4o-mini": {
+    "openai": "gpt-4o-mini-2024-07-18"
+  },
+  "gpt-4-turbo": {
+    "openai": "gpt-4-turbo-2024-04-09"
+  },
+  "gemini-1.5-flash": {
+    "gemini": "gemini-1.5-flash-002"
+  },
+  "gemini-1.5-flash-8b": {
+    "gemini": "gemini-1.5-flash-8b-001"
+  },
+  "gemini-1.5-pro": {
+    "gemini": "gemini-1.5-pro-002"
+  },
+  "gemini-2.0-flash": {
+    "gemini": "gemini-2.0-flash-001"
+  },
+  "o1": {
+    "openai": "o1-2024-12-17"
+  },
+  "o3-mini": {
+    "openai": "o3-mini-2025-01-31"
+  }
+}

data/lib/ruby_llm/aliases.rb ADDED Viewed

@@ -0,0 +1,56 @@
+# frozen_string_literal: true
+module RubyLLM
+  # Manages model aliases, allowing users to reference models by simpler names
+  # that map to specific model versions across different providers.
+  #
+  # Aliases are defined in aliases.json and follow the format:
+  #   {
+  #     "simple-name": {
+  #       "provider1": "specific-version-for-provider1",
+  #       "provider2": "specific-version-for-provider2"
+  #     }
+  #   }
+  class Aliases
+    class << self
+      # Resolves a model ID to its provider-specific version
+      #
+      # @param model_id [String] the model identifier or alias
+      # @param provider [String, Symbol, nil] optional provider to resolve for
+      # @return [String] the resolved model ID, or model_id unchanged when no alias (or no entry for provider) exists
+      def resolve(model_id, provider = nil)
+        return model_id unless aliases[model_id]
+        if provider
+          aliases[model_id][provider.to_s] || model_id
+        else
+          # No provider given: use the first provider entry listed for this alias
+          aliases[model_id].values.first || model_id
+        end
+      end
+      # Returns the aliases mapping, loading it on first access and memoizing it
+      # @return [Hash] the aliases mapping
+      def aliases
+        @aliases ||= load_aliases
+      end
+      # Loads aliases from the aliases.json file located next to this source file
+      # @return [Hash] the parsed aliases, or an empty hash when the file does not exist
+      def load_aliases
+        file_path = File.expand_path('aliases.json', __dir__)
+        if File.exist?(file_path)
+          JSON.parse(File.read(file_path))
+        else
+          {}
+        end
+      end
+      # Reloads aliases from disk, replacing the memoized mapping
+      # @return [Hash] the reloaded aliases
+      def reload!
+        @aliases = load_aliases
+      end
+    end
+  end
+end

data/lib/ruby_llm/chat.rb CHANGED Viewed

@@ -13,9 +13,9 @@ module RubyLLM
     attr_reader :model, :messages, :tools
-    def initialize(model: nil)
+    def initialize(model: nil, provider: nil)
       model_id = model || RubyLLM.config.default_model
-      self.model = model_id
+      with_model(model_id, provider: provider)
       @temperature = 0.7
       @messages = []
       @tools = {}
@@ -32,6 +32,11 @@ module RubyLLM
     alias say ask
+    def with_instructions(instructions)
+      add_message role: :system, content: instructions
+      self
+    end
     def with_tool(tool)
       unless @model.supports_functions
         raise UnsupportedFunctionsError, "Model #{@model.id} doesn't support function calling"
@@ -47,13 +52,9 @@ module RubyLLM
       self
     end
-    def model=(model_id)
-      @model = Models.find model_id
-      @provider = Models.provider_for model_id
-    end
-    def with_model(model_id)
-      self.model = model_id
+    def with_model(model_id, provider: nil)
+      @model = Models.find model_id, provider
+      @provider = Provider.providers[@model.provider.to_sym] || raise(Error, "Unknown provider: #{@model.provider}")
       self
     end

data/lib/ruby_llm/configuration.rb CHANGED Viewed

@@ -14,6 +14,10 @@ module RubyLLM
                   :anthropic_api_key,
                   :gemini_api_key,
                   :deepseek_api_key,
+                  :bedrock_api_key,
+                  :bedrock_secret_key,
+                  :bedrock_region,
+                  :bedrock_session_token,
                   :default_model,
                   :default_embedding_model,
                   :default_image_model,

data/lib/ruby_llm/error.rb CHANGED Viewed

@@ -19,15 +19,21 @@ module RubyLLM
     end
   end
-  class ModelNotFoundError < StandardError; end
+  # Error classes for non-HTTP errors
+  class ConfigurationError < StandardError; end
   class InvalidRoleError < StandardError; end
+  class ModelNotFoundError < StandardError; end
   class UnsupportedFunctionsError < StandardError; end
-  class UnauthorizedError < Error; end
-  class PaymentRequiredError < Error; end
-  class ServiceUnavailableError < Error; end
+  # Error classes for different HTTP status codes
   class BadRequestError < Error; end
+  class ForbiddenError < Error; end
+  class OverloadedError < Error; end
+  class PaymentRequiredError < Error; end
   class RateLimitError < Error; end
   class ServerError < Error; end
+  class ServiceUnavailableError < Error; end
+  class UnauthorizedError < Error; end
   # Faraday middleware that maps provider-specific API errors to RubyLLM errors.
   # Uses provider's parse_error method to extract meaningful error messages.
@@ -56,12 +62,17 @@ module RubyLLM
           raise UnauthorizedError.new(response, message || 'Invalid API key - check your credentials')
         when 402
           raise PaymentRequiredError.new(response, message || 'Payment required - please top up your account')
+        when 403
+          raise ForbiddenError.new(response,
+                                   message || 'Forbidden - you do not have permission to access this resource')
         when 429
           raise RateLimitError.new(response, message || 'Rate limit exceeded - please wait a moment')
         when 500
           raise ServerError.new(response, message || 'API server error - please try again')
         when 502..503
           raise ServiceUnavailableError.new(response, message || 'API server unavailable - please try again later')
+        when 529
+          raise OverloadedError.new(response, message || 'Service overloaded - please try again later')
         else
           raise Error.new(response, message || 'An unknown error occurred')
         end