ruby_llm_swarm 1.9.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/LICENSE +21 -0
- data/README.md +175 -0
- data/lib/generators/ruby_llm/chat_ui/chat_ui_generator.rb +187 -0
- data/lib/generators/ruby_llm/chat_ui/templates/controllers/chats_controller.rb.tt +39 -0
- data/lib/generators/ruby_llm/chat_ui/templates/controllers/messages_controller.rb.tt +24 -0
- data/lib/generators/ruby_llm/chat_ui/templates/controllers/models_controller.rb.tt +14 -0
- data/lib/generators/ruby_llm/chat_ui/templates/jobs/chat_response_job.rb.tt +12 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/chats/_chat.html.erb.tt +16 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/chats/_form.html.erb.tt +29 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/chats/index.html.erb.tt +16 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/chats/new.html.erb.tt +11 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/chats/show.html.erb.tt +23 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/messages/_content.html.erb.tt +1 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/messages/_form.html.erb.tt +21 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/messages/_message.html.erb.tt +13 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/messages/_tool_calls.html.erb.tt +7 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/messages/create.turbo_stream.erb.tt +9 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/models/_model.html.erb.tt +16 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/models/index.html.erb.tt +28 -0
- data/lib/generators/ruby_llm/chat_ui/templates/views/models/show.html.erb.tt +18 -0
- data/lib/generators/ruby_llm/generator_helpers.rb +194 -0
- data/lib/generators/ruby_llm/install/install_generator.rb +106 -0
- data/lib/generators/ruby_llm/install/templates/add_references_to_chats_tool_calls_and_messages_migration.rb.tt +9 -0
- data/lib/generators/ruby_llm/install/templates/chat_model.rb.tt +3 -0
- data/lib/generators/ruby_llm/install/templates/create_chats_migration.rb.tt +7 -0
- data/lib/generators/ruby_llm/install/templates/create_messages_migration.rb.tt +16 -0
- data/lib/generators/ruby_llm/install/templates/create_models_migration.rb.tt +45 -0
- data/lib/generators/ruby_llm/install/templates/create_tool_calls_migration.rb.tt +20 -0
- data/lib/generators/ruby_llm/install/templates/initializer.rb.tt +12 -0
- data/lib/generators/ruby_llm/install/templates/message_model.rb.tt +4 -0
- data/lib/generators/ruby_llm/install/templates/model_model.rb.tt +3 -0
- data/lib/generators/ruby_llm/install/templates/tool_call_model.rb.tt +3 -0
- data/lib/generators/ruby_llm/upgrade_to_v1_7/templates/migration.rb.tt +145 -0
- data/lib/generators/ruby_llm/upgrade_to_v1_7/upgrade_to_v1_7_generator.rb +124 -0
- data/lib/generators/ruby_llm/upgrade_to_v1_9/templates/add_v1_9_message_columns.rb.tt +15 -0
- data/lib/generators/ruby_llm/upgrade_to_v1_9/upgrade_to_v1_9_generator.rb +49 -0
- data/lib/ruby_llm/active_record/acts_as.rb +174 -0
- data/lib/ruby_llm/active_record/acts_as_legacy.rb +384 -0
- data/lib/ruby_llm/active_record/chat_methods.rb +350 -0
- data/lib/ruby_llm/active_record/message_methods.rb +81 -0
- data/lib/ruby_llm/active_record/model_methods.rb +84 -0
- data/lib/ruby_llm/aliases.json +295 -0
- data/lib/ruby_llm/aliases.rb +38 -0
- data/lib/ruby_llm/attachment.rb +220 -0
- data/lib/ruby_llm/chat.rb +816 -0
- data/lib/ruby_llm/chunk.rb +6 -0
- data/lib/ruby_llm/configuration.rb +78 -0
- data/lib/ruby_llm/connection.rb +126 -0
- data/lib/ruby_llm/content.rb +73 -0
- data/lib/ruby_llm/context.rb +29 -0
- data/lib/ruby_llm/embedding.rb +29 -0
- data/lib/ruby_llm/error.rb +84 -0
- data/lib/ruby_llm/image.rb +49 -0
- data/lib/ruby_llm/message.rb +86 -0
- data/lib/ruby_llm/mime_type.rb +71 -0
- data/lib/ruby_llm/model/info.rb +111 -0
- data/lib/ruby_llm/model/modalities.rb +22 -0
- data/lib/ruby_llm/model/pricing.rb +48 -0
- data/lib/ruby_llm/model/pricing_category.rb +46 -0
- data/lib/ruby_llm/model/pricing_tier.rb +33 -0
- data/lib/ruby_llm/model.rb +7 -0
- data/lib/ruby_llm/models.json +33198 -0
- data/lib/ruby_llm/models.rb +231 -0
- data/lib/ruby_llm/models_schema.json +168 -0
- data/lib/ruby_llm/moderation.rb +56 -0
- data/lib/ruby_llm/provider.rb +243 -0
- data/lib/ruby_llm/providers/anthropic/capabilities.rb +134 -0
- data/lib/ruby_llm/providers/anthropic/chat.rb +125 -0
- data/lib/ruby_llm/providers/anthropic/content.rb +44 -0
- data/lib/ruby_llm/providers/anthropic/embeddings.rb +20 -0
- data/lib/ruby_llm/providers/anthropic/media.rb +92 -0
- data/lib/ruby_llm/providers/anthropic/models.rb +63 -0
- data/lib/ruby_llm/providers/anthropic/streaming.rb +45 -0
- data/lib/ruby_llm/providers/anthropic/tools.rb +109 -0
- data/lib/ruby_llm/providers/anthropic.rb +36 -0
- data/lib/ruby_llm/providers/bedrock/capabilities.rb +167 -0
- data/lib/ruby_llm/providers/bedrock/chat.rb +63 -0
- data/lib/ruby_llm/providers/bedrock/media.rb +61 -0
- data/lib/ruby_llm/providers/bedrock/models.rb +98 -0
- data/lib/ruby_llm/providers/bedrock/signing.rb +831 -0
- data/lib/ruby_llm/providers/bedrock/streaming/base.rb +51 -0
- data/lib/ruby_llm/providers/bedrock/streaming/content_extraction.rb +71 -0
- data/lib/ruby_llm/providers/bedrock/streaming/message_processing.rb +67 -0
- data/lib/ruby_llm/providers/bedrock/streaming/payload_processing.rb +80 -0
- data/lib/ruby_llm/providers/bedrock/streaming/prelude_handling.rb +78 -0
- data/lib/ruby_llm/providers/bedrock/streaming.rb +18 -0
- data/lib/ruby_llm/providers/bedrock.rb +82 -0
- data/lib/ruby_llm/providers/deepseek/capabilities.rb +130 -0
- data/lib/ruby_llm/providers/deepseek/chat.rb +16 -0
- data/lib/ruby_llm/providers/deepseek.rb +30 -0
- data/lib/ruby_llm/providers/gemini/capabilities.rb +281 -0
- data/lib/ruby_llm/providers/gemini/chat.rb +454 -0
- data/lib/ruby_llm/providers/gemini/embeddings.rb +37 -0
- data/lib/ruby_llm/providers/gemini/images.rb +47 -0
- data/lib/ruby_llm/providers/gemini/media.rb +112 -0
- data/lib/ruby_llm/providers/gemini/models.rb +40 -0
- data/lib/ruby_llm/providers/gemini/streaming.rb +61 -0
- data/lib/ruby_llm/providers/gemini/tools.rb +198 -0
- data/lib/ruby_llm/providers/gemini/transcription.rb +116 -0
- data/lib/ruby_llm/providers/gemini.rb +37 -0
- data/lib/ruby_llm/providers/gpustack/chat.rb +27 -0
- data/lib/ruby_llm/providers/gpustack/media.rb +46 -0
- data/lib/ruby_llm/providers/gpustack/models.rb +90 -0
- data/lib/ruby_llm/providers/gpustack.rb +34 -0
- data/lib/ruby_llm/providers/mistral/capabilities.rb +155 -0
- data/lib/ruby_llm/providers/mistral/chat.rb +24 -0
- data/lib/ruby_llm/providers/mistral/embeddings.rb +33 -0
- data/lib/ruby_llm/providers/mistral/models.rb +48 -0
- data/lib/ruby_llm/providers/mistral.rb +32 -0
- data/lib/ruby_llm/providers/ollama/chat.rb +27 -0
- data/lib/ruby_llm/providers/ollama/media.rb +46 -0
- data/lib/ruby_llm/providers/ollama/models.rb +36 -0
- data/lib/ruby_llm/providers/ollama.rb +30 -0
- data/lib/ruby_llm/providers/openai/capabilities.rb +299 -0
- data/lib/ruby_llm/providers/openai/chat.rb +88 -0
- data/lib/ruby_llm/providers/openai/embeddings.rb +33 -0
- data/lib/ruby_llm/providers/openai/images.rb +38 -0
- data/lib/ruby_llm/providers/openai/media.rb +81 -0
- data/lib/ruby_llm/providers/openai/models.rb +39 -0
- data/lib/ruby_llm/providers/openai/moderation.rb +34 -0
- data/lib/ruby_llm/providers/openai/streaming.rb +46 -0
- data/lib/ruby_llm/providers/openai/tools.rb +98 -0
- data/lib/ruby_llm/providers/openai/transcription.rb +70 -0
- data/lib/ruby_llm/providers/openai.rb +44 -0
- data/lib/ruby_llm/providers/openai_responses.rb +395 -0
- data/lib/ruby_llm/providers/openrouter/models.rb +73 -0
- data/lib/ruby_llm/providers/openrouter.rb +26 -0
- data/lib/ruby_llm/providers/perplexity/capabilities.rb +137 -0
- data/lib/ruby_llm/providers/perplexity/chat.rb +16 -0
- data/lib/ruby_llm/providers/perplexity/models.rb +42 -0
- data/lib/ruby_llm/providers/perplexity.rb +48 -0
- data/lib/ruby_llm/providers/vertexai/chat.rb +14 -0
- data/lib/ruby_llm/providers/vertexai/embeddings.rb +32 -0
- data/lib/ruby_llm/providers/vertexai/models.rb +130 -0
- data/lib/ruby_llm/providers/vertexai/streaming.rb +14 -0
- data/lib/ruby_llm/providers/vertexai/transcription.rb +16 -0
- data/lib/ruby_llm/providers/vertexai.rb +55 -0
- data/lib/ruby_llm/railtie.rb +35 -0
- data/lib/ruby_llm/responses_session.rb +77 -0
- data/lib/ruby_llm/stream_accumulator.rb +101 -0
- data/lib/ruby_llm/streaming.rb +153 -0
- data/lib/ruby_llm/tool.rb +209 -0
- data/lib/ruby_llm/tool_call.rb +22 -0
- data/lib/ruby_llm/tool_executors.rb +125 -0
- data/lib/ruby_llm/transcription.rb +35 -0
- data/lib/ruby_llm/utils.rb +91 -0
- data/lib/ruby_llm/version.rb +5 -0
- data/lib/ruby_llm.rb +140 -0
- data/lib/tasks/models.rake +525 -0
- data/lib/tasks/release.rake +67 -0
- data/lib/tasks/ruby_llm.rake +15 -0
- data/lib/tasks/vcr.rake +92 -0
- metadata +346 -0
|
@@ -0,0 +1,299 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Determines capabilities and pricing for OpenAI models.
      #
      # Model ids are mapped to an internal "family" string via MODEL_PATTERNS;
      # every other lookup (context window, max tokens, pricing, feature
      # support) is keyed off that family.
      module Capabilities
        module_function

        # Ordered family patterns; the FIRST match wins, so generic patterns
        # must exclude their specialised variants with a negative lookahead
        # (see :o1 vs :o1_mini) or appear after them.
        MODEL_PATTERNS = {
          dall_e: /^dall-e/,
          chatgpt4o: /^chatgpt-4o/,
          gpt41: /^gpt-4\.1(?!-(?:mini|nano))/,
          gpt41_mini: /^gpt-4\.1-mini/,
          gpt41_nano: /^gpt-4\.1-nano/,
          gpt4: /^gpt-4(?:-\d{6})?$/,
          gpt4_turbo: /^gpt-4(?:\.5)?-(?:\d{6}-)?(preview|turbo)/,
          gpt35_turbo: /^gpt-3\.5-turbo/,
          gpt4o: /^gpt-4o(?!-(?:mini|audio|realtime|transcribe|tts|search))/,
          gpt4o_audio: /^gpt-4o-(?:audio)/,
          gpt4o_mini: /^gpt-4o-mini(?!-(?:audio|realtime|transcribe|tts|search))/,
          gpt4o_mini_audio: /^gpt-4o-mini-audio/,
          gpt4o_mini_realtime: /^gpt-4o-mini-realtime/,
          gpt4o_mini_transcribe: /^gpt-4o-mini-transcribe/,
          gpt4o_mini_tts: /^gpt-4o-mini-tts/,
          gpt4o_realtime: /^gpt-4o-realtime/,
          gpt4o_search: /^gpt-4o-search/,
          gpt4o_transcribe: /^gpt-4o-transcribe/,
          # Lookahead keeps gpt5_mini/gpt5_nano reachable; without it
          # /^gpt-5/ would swallow "gpt-5-mini" and "gpt-5-nano" first.
          gpt5: /^gpt-5(?!-(?:mini|nano))/,
          gpt5_mini: /^gpt-5-mini/,
          gpt5_nano: /^gpt-5-nano/,
          o1: /^o1(?!-(?:mini|pro))/,
          o1_mini: /^o1-mini/,
          o1_pro: /^o1-pro/,
          o3_mini: /^o3-mini/,
          babbage: /^babbage/,
          davinci: /^davinci/,
          embedding3_large: /^text-embedding-3-large/,
          embedding3_small: /^text-embedding-3-small/,
          embedding_ada: /^text-embedding-ada/,
          tts1: /^tts-1(?!-hd)/,
          tts1_hd: /^tts-1-hd/,
          whisper: /^whisper/,
          moderation: /^(?:omni|text)-moderation/
        }.freeze

        # Context window (input token limit) for a model id; nil for models
        # where the concept does not apply (TTS, STT, embeddings, moderation).
        def context_window_for(model_id)
          case model_family(model_id)
          when 'gpt41', 'gpt41_mini', 'gpt41_nano' then 1_047_576
          when 'gpt5', 'gpt5_mini', 'gpt5_nano', 'chatgpt4o', 'gpt4_turbo', 'gpt4o', 'gpt4o_audio', 'gpt4o_mini',
               'gpt4o_mini_audio', 'gpt4o_mini_realtime', 'gpt4o_realtime',
               'gpt4o_search', 'gpt4o_transcribe', 'gpt4o_mini_search', 'o1_mini' then 128_000
          when 'gpt4' then 8_192
          when 'gpt4o_mini_transcribe' then 16_000
          when 'o1', 'o1_pro', 'o3_mini' then 200_000
          when 'gpt35_turbo' then 16_385
          when 'gpt4o_mini_tts', 'tts1', 'tts1_hd', 'whisper', 'moderation',
               'embedding3_large', 'embedding3_small', 'embedding_ada' then nil
          else 4_096
          end
        end

        # Maximum output tokens for a model id; nil where not applicable.
        def max_tokens_for(model_id)
          case model_family(model_id)
          when 'gpt5', 'gpt5_mini', 'gpt5_nano' then 400_000
          when 'gpt41', 'gpt41_mini', 'gpt41_nano' then 32_768
          when 'chatgpt4o', 'gpt4o', 'gpt4o_mini', 'gpt4o_mini_search' then 16_384
          when 'babbage', 'davinci' then 16_384 # rubocop:disable Lint/DuplicateBranch
          when 'gpt4' then 8_192
          when 'gpt35_turbo' then 4_096
          when 'gpt4_turbo', 'gpt4o_realtime', 'gpt4o_mini_realtime' then 4_096 # rubocop:disable Lint/DuplicateBranch
          when 'gpt4o_mini_transcribe' then 2_000
          when 'o1', 'o1_pro', 'o3_mini' then 100_000
          when 'o1_mini' then 65_536
          when 'gpt4o_mini_tts', 'tts1', 'tts1_hd', 'whisper', 'moderation',
               'embedding3_large', 'embedding3_small', 'embedding_ada' then nil
          else 16_384 # rubocop:disable Lint/DuplicateBranch
          end
        end

        # Whether the model accepts image inputs.
        # NOTE(review): 'moderation' and 'gpt4o_mini_search' appear here but
        # model_family can currently return neither with vision semantics
        # confirmed — verify against the models registry.
        def supports_vision?(model_id)
          case model_family(model_id)
          when 'gpt5', 'gpt5_mini', 'gpt5_nano', 'gpt41', 'gpt41_mini', 'gpt41_nano', 'chatgpt4o', 'gpt4',
               'gpt4_turbo', 'gpt4o', 'gpt4o_mini', 'o1', 'o1_pro', 'moderation', 'gpt4o_search',
               'gpt4o_mini_search' then true
          else false
          end
        end

        # Whether the model supports tool/function calling.
        def supports_functions?(model_id)
          case model_family(model_id)
          when 'gpt5', 'gpt5_mini', 'gpt5_nano', 'gpt41', 'gpt41_mini', 'gpt41_nano', 'gpt4', 'gpt4_turbo', 'gpt4o',
               'gpt4o_mini', 'o1', 'o1_pro', 'o3_mini' then true
          when 'chatgpt4o', 'gpt35_turbo', 'o1_mini', 'gpt4o_mini_tts',
               'gpt4o_transcribe', 'gpt4o_search', 'gpt4o_mini_search' then false
          else false # rubocop:disable Lint/DuplicateBranch
          end
        end

        # Whether the model supports JSON-schema structured output.
        def supports_structured_output?(model_id)
          case model_family(model_id)
          when 'gpt5', 'gpt5_mini', 'gpt5_nano', 'gpt41', 'gpt41_mini', 'gpt41_nano', 'chatgpt4o', 'gpt4o',
               'gpt4o_mini', 'o1', 'o1_pro', 'o3_mini' then true
          else false
          end
        end

        # JSON mode support mirrors structured-output support.
        def supports_json_mode?(model_id)
          supports_structured_output?(model_id)
        end

        # USD per million tokens, keyed by family. Single-price models
        # (embeddings, TTS, Whisper) use :price instead of :input/:output.
        # NOTE(review): :gpt45 has no MODEL_PATTERNS entry — "gpt-4.5-*" ids
        # currently resolve to the gpt4_turbo family, so this price is
        # unreachable; confirm intended mapping upstream.
        PRICES = {
          gpt5: { input: 1.25, output: 10.0, cached_input: 0.125 },
          gpt5_mini: { input: 0.25, output: 2.0, cached_input: 0.025 },
          gpt5_nano: { input: 0.05, output: 0.4, cached_input: 0.005 },
          gpt41: { input: 2.0, output: 8.0, cached_input: 0.5 },
          gpt41_mini: { input: 0.4, output: 1.6, cached_input: 0.1 },
          gpt41_nano: { input: 0.1, output: 0.4 },
          chatgpt4o: { input: 5.0, output: 15.0 },
          gpt4: { input: 10.0, output: 30.0 },
          gpt4_turbo: { input: 10.0, output: 30.0 },
          gpt45: { input: 75.0, output: 150.0 },
          gpt35_turbo: { input: 0.5, output: 1.5 },
          gpt4o: { input: 2.5, output: 10.0 },
          gpt4o_audio: { input: 2.5, output: 10.0, audio_input: 40.0, audio_output: 80.0 },
          gpt4o_mini: { input: 0.15, output: 0.6 },
          gpt4o_mini_audio: { input: 0.15, output: 0.6, audio_input: 10.0, audio_output: 20.0 },
          gpt4o_mini_realtime: { input: 0.6, output: 2.4 },
          gpt4o_mini_transcribe: { input: 1.25, output: 5.0, audio_input: 3.0 },
          gpt4o_mini_tts: { input: 0.6, output: 12.0 },
          gpt4o_realtime: { input: 5.0, output: 20.0 },
          gpt4o_search: { input: 2.5, output: 10.0 },
          gpt4o_transcribe: { input: 2.5, output: 10.0, audio_input: 6.0 },
          o1: { input: 15.0, output: 60.0 },
          o1_mini: { input: 1.1, output: 4.4 },
          o1_pro: { input: 150.0, output: 600.0 },
          o3_mini: { input: 1.1, output: 4.4 },
          babbage: { input: 0.4, output: 0.4 },
          davinci: { input: 2.0, output: 2.0 },
          embedding3_large: { price: 0.13 },
          embedding3_small: { price: 0.02 },
          embedding_ada: { price: 0.10 },
          tts1: { price: 15.0 },
          tts1_hd: { price: 30.0 },
          whisper: { price: 0.006 },
          moderation: { price: 0.0 }
        }.freeze

        # Resolves a model id to its family string; 'other' when unmatched.
        def model_family(model_id)
          MODEL_PATTERNS.each do |family, pattern|
            return family.to_s if model_id.match?(pattern)
          end
          'other'
        end

        # Input price per million tokens (falls back to the flat :price, then
        # to the provider default).
        def input_price_for(model_id)
          family = model_family(model_id).to_sym
          prices = PRICES.fetch(family, { input: default_input_price })
          prices[:input] || prices[:price] || default_input_price
        end

        # Cached-input price per million tokens, or nil when the family has
        # no prompt-caching discount.
        def cached_input_price_for(model_id)
          family = model_family(model_id).to_sym
          prices = PRICES.fetch(family, {})
          prices[:cached_input]
        end

        # Output price per million tokens (same fallback chain as input).
        def output_price_for(model_id)
          family = model_family(model_id).to_sym
          prices = PRICES.fetch(family, { output: default_output_price })
          prices[:output] || prices[:price] || default_output_price
        end

        # Broad category of the model: 'embedding', 'audio', 'moderation',
        # 'image' or 'chat'. Matches the FAMILY string, not the raw id.
        def model_type(model_id)
          case model_family(model_id)
          when /embedding/ then 'embedding'
          when /^tts|whisper|gpt4o_(?:mini_)?(?:transcribe|tts)$/ then 'audio'
          when 'moderation' then 'moderation'
          when /dall/ then 'image'
          else 'chat'
          end
        end

        # Fallback input price (USD per million tokens) for unknown families.
        def default_input_price
          0.50
        end

        # Fallback output price (USD per million tokens) for unknown families.
        def default_output_price
          1.50
        end

        # Human-friendly display name for a model id, e.g.
        # "gpt-4o-mini" -> "GPT-4o-Mini".
        def format_display_name(model_id)
          model_id.then { |id| humanize(id) }
                  .then { |name| apply_special_formatting(name) }
        end

        # "gpt-4o-mini" -> "Gpt 4o Mini" (hyphens to spaces, Title Case).
        def humanize(id)
          id.tr('-', ' ')
            .split
            .map(&:capitalize)
            .join(' ')
        end

        # Post-processes a humanized name: brand casing (GPT, ChatGPT, TTS,
        # DALL-E), date compaction, and re-hyphenation of version suffixes.
        # The hyphenation rules use gsub's block form — a plain '\0'.tr(...)
        # replacement would run tr on the literal string "\0" (a no-op) and
        # substitute the match unchanged.
        def apply_special_formatting(name)
          name
            .gsub(/(\d{4}) (\d{2}) (\d{2})/, '\1\2\3')
            .gsub(/^(?:Gpt|Chatgpt|Tts|Dall E) /) { |m| special_prefix_format(m.strip) }
            .gsub(/^O([13]) /, 'O\1-')
            .gsub(/^O[13] Mini/) { |m| m.tr(' ', '-') }
            .gsub(/\d\.\d /) { |m| m.sub(' ', '-') }
            .gsub(/4o (?=Mini|Preview|Turbo|Audio|Realtime|Transcribe|Tts)/, '4o-')
            .gsub(/\bHd\b/, 'HD')
            .gsub(/(?:Omni|Text) Moderation/) { |m| m.tr(' ', '-') }
            .gsub('Text Embedding', 'text-embedding-')
        end

        # Brand casing for known capitalized prefixes.
        def special_prefix_format(prefix)
          case prefix # rubocop:disable Style/HashLikeCase
          when 'Gpt' then 'GPT-'
          when 'Chatgpt' then 'ChatGPT-'
          when 'Tts' then 'TTS-'
          when 'Dall E' then 'DALL-E-'
          end
        end

        # Reasoning models only accept temperature=1.0; search models accept
        # none at all (nil removes the parameter from the payload).
        def self.normalize_temperature(temperature, model_id)
          if model_id.match?(/^(o\d|gpt-5)/)
            RubyLLM.logger.debug "Model #{model_id} requires temperature=1.0, ignoring provided value"
            1.0
          elsif model_id.match?(/-search/)
            RubyLLM.logger.debug "Model #{model_id} does not accept temperature parameter, removing"
            nil
          else
            temperature
          end
        end

        # Input/output modality lists derived from the model id and family.
        def modalities_for(model_id)
          modalities = {
            input: ['text'],
            output: ['text']
          }

          # Vision support
          modalities[:input] << 'image' if supports_vision?(model_id)
          modalities[:input] << 'audio' if model_id.match?(/whisper|audio|tts|transcribe/)
          modalities[:input] << 'pdf' if supports_vision?(model_id)
          modalities[:output] << 'audio' if model_id.match?(/tts|audio/)
          modalities[:output] << 'image' if model_id.match?(/dall-e|image/)
          modalities[:output] << 'embeddings' if model_id.match?(/embedding/)
          modalities[:output] << 'moderation' if model_id.match?(/moderation/)

          modalities
        end

        # Capability tag list (streaming, function_calling, ...) for the id.
        def capabilities_for(model_id) # rubocop:disable Metrics/PerceivedComplexity
          capabilities = []

          capabilities << 'streaming' unless model_id.match?(/moderation|embedding/)
          capabilities << 'function_calling' if supports_functions?(model_id)
          capabilities << 'structured_output' if supports_json_mode?(model_id)
          capabilities << 'batch' if model_id.match?(/embedding|batch/)
          capabilities << 'reasoning' if model_id.match?(/o\d|gpt-5|codex/)

          if model_id.match?(/gpt-4-turbo|gpt-4o/)
            capabilities << 'image_generation' if model_id.match?(/vision/)
            capabilities << 'speech_generation' if model_id.match?(/audio/)
            capabilities << 'transcription' if model_id.match?(/audio/)
          end

          capabilities
        end

        # Pricing structure for the id; batch pricing is half of standard.
        def pricing_for(model_id)
          standard_pricing = {
            input_per_million: input_price_for(model_id),
            output_per_million: output_price_for(model_id)
          }

          if respond_to?(:cached_input_price_for)
            cached_price = cached_input_price_for(model_id)
            standard_pricing[:cached_input_per_million] = cached_price if cached_price
          end

          pricing = { text_tokens: { standard: standard_pricing } }

          if model_id.match?(/embedding|batch/)
            pricing[:text_tokens][:batch] = {
              input_per_million: standard_pricing[:input_per_million] * 0.5,
              output_per_million: standard_pricing[:output_per_million] * 0.5
            }
          end

          pricing
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,88 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Chat methods of the OpenAI API integration
      module Chat
        # Relative endpoint for chat completions.
        def completion_url
          'chat/completions'
        end

        module_function

        # Assembles the request body for a completion call. Optional pieces
        # (temperature, tools, structured-output schema, stream options) are
        # only added when present.
        def render_payload(messages, tools:, temperature:, model:, stream: false, schema: nil) # rubocop:disable Metrics/ParameterLists
          payload = {
            model: model.id,
            messages: format_messages(messages),
            stream: stream
          }

          payload[:temperature] = temperature unless temperature.nil?
          payload[:tools] = tools.map { |_, tool| tool_for(tool) } if tools.any?

          if schema
            # Strict mode is the default; callers opt out via strict: false.
            payload[:response_format] = {
              type: 'json_schema',
              json_schema: {
                name: 'response',
                schema: schema,
                strict: schema[:strict] != false
              }
            }
          end

          payload[:stream_options] = { include_usage: true } if stream
          payload
        end

        # Turns a raw completion response into a Message, raising on API
        # errors and returning nil for empty or message-less bodies.
        def parse_completion_response(response)
          body = response.body
          return if body.empty?

          error_message = body.dig('error', 'message')
          raise Error.new(response, error_message) if error_message

          message_data = body.dig('choices', 0, 'message')
          return unless message_data

          usage = body['usage'] || {}

          Message.new(
            role: :assistant,
            content: message_data['content'],
            tool_calls: parse_tool_calls(message_data['tool_calls']),
            input_tokens: usage['prompt_tokens'],
            output_tokens: usage['completion_tokens'],
            cached_tokens: usage.dig('prompt_tokens_details', 'cached_tokens'),
            cache_creation_tokens: 0,
            model_id: body['model'],
            raw: response
          )
        end

        # Serializes chat history into the wire format, dropping nil fields.
        def format_messages(messages)
          messages.map do |message|
            {
              role: format_role(message.role),
              content: Media.format_content(message.content),
              tool_calls: format_tool_calls(message.tool_calls),
              tool_call_id: message.tool_call_id
            }.compact
          end
        end

        # Maps our role symbols to OpenAI role strings; newer models expect
        # 'developer' in place of 'system' unless configured otherwise.
        def format_role(role)
          return role.to_s unless role == :system

          @config.openai_use_system_role ? 'system' : 'developer'
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Embeddings methods of the OpenAI API integration
      module Embeddings
        module_function

        # Relative endpoint for embeddings (arguments accepted and ignored).
        def embedding_url(...)
          'embeddings'
        end

        # Request body for an embedding call; nil dimensions are omitted.
        def render_embedding_payload(text, model:, dimensions:)
          { model: model, input: text, dimensions: dimensions }.compact
        end

        # Builds an Embedding from the API response. A single non-array
        # input yields a flat vector instead of a one-element list.
        def parse_embedding_response(response, model:, text:)
          body = response.body
          tokens = body.dig('usage', 'prompt_tokens') || 0
          embeddings = body['data'].map { |entry| entry['embedding'] }
          embeddings = embeddings.first if embeddings.length == 1 && !text.is_a?(Array)

          Embedding.new(vectors: embeddings, model: model, input_tokens: tokens)
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Image generation methods for the OpenAI API integration
      module Images
        module_function

        # Relative endpoint for image generation.
        def images_url
          'images/generations'
        end

        # Request body for a single image generation.
        def render_image_payload(prompt, model:, size:)
          {
            model: model,
            prompt: prompt,
            n: 1,
            size: size
          }
        end

        # Builds an Image from the first entry of the API response.
        def parse_image_response(response, model:)
          payload = response.body['data'].first

          Image.new(
            url: payload['url'],
            mime_type: 'image/png', # DALL-E typically returns PNGs
            revised_prompt: payload['revised_prompt'],
            model_id: model,
            data: payload['b64_json']
          )
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,81 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Handles formatting of media content (images, audio) for OpenAI APIs
      module Media
        module_function

        # Converts content into OpenAI's parts array. Raw content passes
        # through unchanged, hashes/arrays are JSON-encoded, and plain
        # strings are returned as-is; only Content objects are expanded.
        def format_content(content) # rubocop:disable Metrics/PerceivedComplexity
          return content.value if content.is_a?(RubyLLM::Content::Raw)
          return content.to_json if content.is_a?(Hash) || content.is_a?(Array)
          return content unless content.is_a?(Content)

          parts = content.text ? [format_text(content.text)] : []

          content.attachments.each do |attachment|
            parts << case attachment.type
                     when :image then format_image(attachment)
                     when :pdf then format_pdf(attachment)
                     when :audio then format_audio(attachment)
                     when :text then format_text_file(attachment)
                     else raise UnsupportedAttachmentError, attachment.type
                     end
          end

          parts
        end

        # image_url part: remote URLs pass through, local files are inlined.
        def format_image(attachment)
          {
            type: 'image_url',
            image_url: {
              url: attachment.url? ? attachment.source : attachment.for_llm
            }
          }
        end

        # file part carrying the PDF's name and inline data.
        def format_pdf(attachment)
          {
            type: 'file',
            file: {
              filename: attachment.filename,
              file_data: attachment.for_llm
            }
          }
        end

        # text part sourced from an attached text file.
        def format_text_file(attachment)
          {
            type: 'text',
            text: attachment.for_llm
          }
        end

        # input_audio part with encoded data and its format.
        def format_audio(attachment)
          {
            type: 'input_audio',
            input_audio: {
              data: attachment.encoded,
              format: attachment.format
            }
          }
        end

        # Plain text part.
        def format_text(text)
          {
            type: 'text',
            text: text
          }
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Models methods of the OpenAI API integration
      module Models
        module_function

        # Relative endpoint for listing models.
        def models_url
          'models'
        end

        # Maps the raw /models listing into Model::Info records, deriving
        # capabilities/pricing from each model id via the capabilities module.
        def parse_list_models_response(response, slug, capabilities)
          Array(response.body['data']).map do |entry|
            id = entry['id']
            created = entry['created']

            Model::Info.new(
              id: id,
              name: capabilities.format_display_name(id),
              provider: slug,
              family: capabilities.model_family(id),
              created_at: created ? Time.at(created) : nil,
              context_window: capabilities.context_window_for(id),
              max_output_tokens: capabilities.max_tokens_for(id),
              modalities: capabilities.modalities_for(id),
              capabilities: capabilities.capabilities_for(id),
              pricing: capabilities.pricing_for(id),
              metadata: {
                object: entry['object'],
                owned_by: entry['owned_by']
              }
            )
          end
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,34 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Moderation methods of the OpenAI API integration
      module Moderation
        module_function

        # Relative endpoint for moderations.
        def moderation_url
          'moderations'
        end

        # Request body for a moderation call.
        def render_moderation_payload(input, model:)
          {
            model: model,
            input: input
          }
        end

        # Builds a Moderation result, raising on API-level errors.
        def parse_moderation_response(response, model:)
          body = response.body
          error_message = body.dig('error', 'message')
          raise Error.new(response, error_message) if error_message

          RubyLLM::Moderation.new(
            id: body['id'],
            model: model,
            results: body['results'] || []
          )
        end
      end
    end
  end
end
|
|
@@ -0,0 +1,46 @@
|
|
|
1
|
+
# frozen_string_literal: true

module RubyLLM
  module Providers
    class OpenAI
      # Streaming methods of the OpenAI API integration
      module Streaming
        module_function

        # Streaming reuses the completions endpoint.
        def stream_url
          completion_url
        end

        # Converts one SSE payload into a Chunk. Tool-call arguments arrive
        # in fragments during streaming, so they are not parsed here.
        def build_chunk(data)
          usage = data['usage'] || {}
          delta = data.dig('choices', 0, 'delta') || {}

          Chunk.new(
            role: :assistant,
            model_id: data['model'],
            content: delta['content'],
            tool_calls: parse_tool_calls(delta['tool_calls'], parse_arguments: false),
            input_tokens: usage['prompt_tokens'],
            output_tokens: usage['completion_tokens'],
            cached_tokens: usage.dig('prompt_tokens_details', 'cached_tokens'),
            cache_creation_tokens: 0
          )
        end

        # Maps an error payload from the stream to [status, message];
        # returns nil when the payload carries no error.
        def parse_streaming_error(data)
          error = JSON.parse(data)['error']
          return unless error

          status = case error['type']
                   when 'server_error' then 500
                   when 'rate_limit_exceeded', 'insufficient_quota' then 429
                   else 400
                   end

          [status, error['message']]
        end
      end
    end
  end
end
|