openai 0.61.0 → 0.62.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (157)
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +18 -0
  3. data/README.md +1 -1
  4. data/lib/openai/models/admin/organization/usage_audio_speeches_response.rb +10 -1
  5. data/lib/openai/models/admin/organization/usage_audio_transcriptions_response.rb +10 -1
  6. data/lib/openai/models/admin/organization/usage_code_interpreter_sessions_response.rb +10 -1
  7. data/lib/openai/models/admin/organization/usage_completions_response.rb +10 -1
  8. data/lib/openai/models/admin/organization/usage_costs_response.rb +10 -1
  9. data/lib/openai/models/admin/organization/usage_embeddings_response.rb +10 -1
  10. data/lib/openai/models/admin/organization/usage_images_response.rb +10 -1
  11. data/lib/openai/models/admin/organization/usage_moderations_response.rb +10 -1
  12. data/lib/openai/models/admin/organization/usage_vector_stores_response.rb +10 -1
  13. data/lib/openai/models/chat/chat_completion_token_logprob.rb +1 -2
  14. data/lib/openai/models/chat/completion_create_params.rb +4 -3
  15. data/lib/openai/models/image_edit_params.rb +85 -31
  16. data/lib/openai/models/image_generate_params.rb +78 -26
  17. data/lib/openai/models/image_model.rb +5 -2
  18. data/lib/openai/models/realtime/audio_transcription.rb +37 -5
  19. data/lib/openai/models/realtime/client_secret_create_response.rb +1 -2
  20. data/lib/openai/models/realtime/realtime_audio_config_input.rb +3 -0
  21. data/lib/openai/models/realtime/realtime_audio_input_turn_detection.rb +3 -0
  22. data/lib/openai/models/realtime/realtime_reasoning.rb +24 -0
  23. data/lib/openai/models/realtime/realtime_reasoning_effort.rb +22 -0
  24. data/lib/openai/models/realtime/realtime_response_create_params.rb +18 -1
  25. data/lib/openai/models/realtime/realtime_session.rb +6 -0
  26. data/lib/openai/models/realtime/realtime_session_create_request.rb +21 -1
  27. data/lib/openai/models/realtime/realtime_session_create_response.rb +41 -17
  28. data/lib/openai/models/realtime/realtime_transcription_session_audio_input.rb +3 -0
  29. data/lib/openai/models/realtime/realtime_transcription_session_audio_input_turn_detection.rb +3 -0
  30. data/lib/openai/models/realtime/realtime_transcription_session_create_response.rb +9 -5
  31. data/lib/openai/models/realtime/realtime_transcription_session_turn_detection.rb +2 -1
  32. data/lib/openai/models/realtime/realtime_translation_client_event.rb +45 -0
  33. data/lib/openai/models/realtime/realtime_translation_client_secret_create_request.rb +85 -0
  34. data/lib/openai/models/realtime/realtime_translation_client_secret_create_response.rb +42 -0
  35. data/lib/openai/models/realtime/realtime_translation_input_audio_buffer_append_event.rb +51 -0
  36. data/lib/openai/models/realtime/realtime_translation_input_transcript_delta_event.rb +55 -0
  37. data/lib/openai/models/realtime/realtime_translation_output_audio_delta_event.rb +89 -0
  38. data/lib/openai/models/realtime/realtime_translation_output_transcript_delta_event.rb +54 -0
  39. data/lib/openai/models/realtime/realtime_translation_server_event.rb +53 -0
  40. data/lib/openai/models/realtime/realtime_translation_session.rb +158 -0
  41. data/lib/openai/models/realtime/realtime_translation_session_close_event.rb +30 -0
  42. data/lib/openai/models/realtime/realtime_translation_session_closed_event.rb +28 -0
  43. data/lib/openai/models/realtime/realtime_translation_session_create_request.rb +138 -0
  44. data/lib/openai/models/realtime/realtime_translation_session_created_event.rb +38 -0
  45. data/lib/openai/models/realtime/realtime_translation_session_update_event.rb +43 -0
  46. data/lib/openai/models/realtime/realtime_translation_session_update_request.rb +129 -0
  47. data/lib/openai/models/realtime/realtime_translation_session_updated_event.rb +37 -0
  48. data/lib/openai/models/realtime/transcription_session_updated_event.rb +1 -2
  49. data/lib/openai/models/responses/response.rb +4 -3
  50. data/lib/openai/models/responses/response_create_params.rb +4 -3
  51. data/lib/openai/models/responses/response_includable.rb +2 -0
  52. data/lib/openai/models/responses/response_text_delta_event.rb +2 -2
  53. data/lib/openai/models/responses/response_text_done_event.rb +2 -2
  54. data/lib/openai/models/responses/responses_client_event.rb +4 -3
  55. data/lib/openai/models/responses/tool.rb +81 -16
  56. data/lib/openai/resources/chat/completions.rb +2 -2
  57. data/lib/openai/resources/images.rb +6 -6
  58. data/lib/openai/resources/realtime/calls.rb +5 -1
  59. data/lib/openai/resources/responses.rb +2 -2
  60. data/lib/openai/version.rb +1 -1
  61. data/lib/openai.rb +18 -1
  62. data/rbi/openai/models/admin/organization/usage_audio_speeches_response.rbi +11 -1
  63. data/rbi/openai/models/admin/organization/usage_audio_transcriptions_response.rbi +11 -1
  64. data/rbi/openai/models/admin/organization/usage_code_interpreter_sessions_response.rbi +11 -1
  65. data/rbi/openai/models/admin/organization/usage_completions_response.rbi +11 -1
  66. data/rbi/openai/models/admin/organization/usage_costs_response.rbi +11 -1
  67. data/rbi/openai/models/admin/organization/usage_embeddings_response.rbi +11 -1
  68. data/rbi/openai/models/admin/organization/usage_images_response.rbi +11 -1
  69. data/rbi/openai/models/admin/organization/usage_moderations_response.rbi +11 -1
  70. data/rbi/openai/models/admin/organization/usage_vector_stores_response.rbi +11 -1
  71. data/rbi/openai/models/chat/chat_completion_token_logprob.rbi +2 -4
  72. data/rbi/openai/models/chat/completion_create_params.rbi +6 -4
  73. data/rbi/openai/models/image_edit_params.rbi +102 -45
  74. data/rbi/openai/models/image_generate_params.rbi +93 -39
  75. data/rbi/openai/models/image_model.rbi +8 -3
  76. data/rbi/openai/models/realtime/audio_transcription.rbi +85 -6
  77. data/rbi/openai/models/realtime/realtime_audio_config_input.rbi +6 -0
  78. data/rbi/openai/models/realtime/realtime_audio_input_turn_detection.rbi +3 -0
  79. data/rbi/openai/models/realtime/realtime_reasoning.rbi +54 -0
  80. data/rbi/openai/models/realtime/realtime_reasoning_effort.rbi +44 -0
  81. data/rbi/openai/models/realtime/realtime_response_create_params.rbi +26 -0
  82. data/rbi/openai/models/realtime/realtime_session.rbi +9 -0
  83. data/rbi/openai/models/realtime/realtime_session_create_request.rbi +31 -0
  84. data/rbi/openai/models/realtime/realtime_session_create_response.rbi +53 -32
  85. data/rbi/openai/models/realtime/realtime_transcription_session_audio_input.rbi +6 -0
  86. data/rbi/openai/models/realtime/realtime_transcription_session_audio_input_turn_detection.rbi +3 -0
  87. data/rbi/openai/models/realtime/realtime_transcription_session_create_response.rbi +13 -7
  88. data/rbi/openai/models/realtime/realtime_transcription_session_turn_detection.rbi +2 -1
  89. data/rbi/openai/models/realtime/realtime_translation_client_event.rbi +29 -0
  90. data/rbi/openai/models/realtime/realtime_translation_client_secret_create_request.rbi +193 -0
  91. data/rbi/openai/models/realtime/realtime_translation_client_secret_create_response.rbi +69 -0
  92. data/rbi/openai/models/realtime/realtime_translation_input_audio_buffer_append_event.rbi +69 -0
  93. data/rbi/openai/models/realtime/realtime_translation_input_transcript_delta_event.rbi +77 -0
  94. data/rbi/openai/models/realtime/realtime_translation_output_audio_delta_event.rbi +148 -0
  95. data/rbi/openai/models/realtime/realtime_translation_output_transcript_delta_event.rbi +76 -0
  96. data/rbi/openai/models/realtime/realtime_translation_server_event.rbi +33 -0
  97. data/rbi/openai/models/realtime/realtime_translation_session.rbi +339 -0
  98. data/rbi/openai/models/realtime/realtime_translation_session_close_event.rbi +44 -0
  99. data/rbi/openai/models/realtime/realtime_translation_session_closed_event.rbi +39 -0
  100. data/rbi/openai/models/realtime/realtime_translation_session_create_request.rbi +322 -0
  101. data/rbi/openai/models/realtime/realtime_translation_session_created_event.rbi +68 -0
  102. data/rbi/openai/models/realtime/realtime_translation_session_update_event.rbi +78 -0
  103. data/rbi/openai/models/realtime/realtime_translation_session_update_request.rbi +313 -0
  104. data/rbi/openai/models/realtime/realtime_translation_session_updated_event.rbi +67 -0
  105. data/rbi/openai/models/realtime/transcription_session_updated_event.rbi +0 -2
  106. data/rbi/openai/models/responses/response.rbi +6 -4
  107. data/rbi/openai/models/responses/response_create_params.rbi +6 -4
  108. data/rbi/openai/models/responses/response_includable.rbi +2 -0
  109. data/rbi/openai/models/responses/response_text_delta_event.rbi +2 -2
  110. data/rbi/openai/models/responses/response_text_done_event.rbi +2 -2
  111. data/rbi/openai/models/responses/responses_client_event.rbi +6 -4
  112. data/rbi/openai/models/responses/tool.rbi +122 -27
  113. data/rbi/openai/resources/chat/completions.rbi +6 -4
  114. data/rbi/openai/resources/images.rbi +110 -44
  115. data/rbi/openai/resources/realtime/calls.rbi +7 -0
  116. data/rbi/openai/resources/responses.rbi +6 -4
  117. data/sig/openai/models/admin/organization/usage_audio_speeches_response.rbs +7 -2
  118. data/sig/openai/models/admin/organization/usage_audio_transcriptions_response.rbs +7 -2
  119. data/sig/openai/models/admin/organization/usage_code_interpreter_sessions_response.rbs +7 -2
  120. data/sig/openai/models/admin/organization/usage_completions_response.rbs +7 -2
  121. data/sig/openai/models/admin/organization/usage_costs_response.rbs +7 -2
  122. data/sig/openai/models/admin/organization/usage_embeddings_response.rbs +7 -2
  123. data/sig/openai/models/admin/organization/usage_images_response.rbs +7 -2
  124. data/sig/openai/models/admin/organization/usage_moderations_response.rbs +7 -2
  125. data/sig/openai/models/admin/organization/usage_vector_stores_response.rbs +7 -2
  126. data/sig/openai/models/image_edit_params.rbs +5 -4
  127. data/sig/openai/models/image_generate_params.rbs +5 -4
  128. data/sig/openai/models/image_model.rbs +11 -5
  129. data/sig/openai/models/realtime/audio_transcription.rbs +25 -0
  130. data/sig/openai/models/realtime/realtime_reasoning.rbs +24 -0
  131. data/sig/openai/models/realtime/realtime_reasoning_effort.rbs +20 -0
  132. data/sig/openai/models/realtime/realtime_response_create_params.rbs +16 -0
  133. data/sig/openai/models/realtime/realtime_session_create_request.rbs +18 -0
  134. data/sig/openai/models/realtime/realtime_session_create_response.rbs +27 -4
  135. data/sig/openai/models/realtime/realtime_transcription_session_create_response.rbs +4 -8
  136. data/sig/openai/models/realtime/realtime_translation_client_event.rbs +16 -0
  137. data/sig/openai/models/realtime/realtime_translation_client_secret_create_request.rbs +69 -0
  138. data/sig/openai/models/realtime/realtime_translation_client_secret_create_response.rbs +32 -0
  139. data/sig/openai/models/realtime/realtime_translation_input_audio_buffer_append_event.rbs +34 -0
  140. data/sig/openai/models/realtime/realtime_translation_input_transcript_delta_event.rbs +37 -0
  141. data/sig/openai/models/realtime/realtime_translation_output_audio_delta_event.rbs +70 -0
  142. data/sig/openai/models/realtime/realtime_translation_output_transcript_delta_event.rbs +37 -0
  143. data/sig/openai/models/realtime/realtime_translation_server_event.rbs +20 -0
  144. data/sig/openai/models/realtime/realtime_translation_session.rbs +131 -0
  145. data/sig/openai/models/realtime/realtime_translation_session_close_event.rbs +20 -0
  146. data/sig/openai/models/realtime/realtime_translation_session_closed_event.rbs +18 -0
  147. data/sig/openai/models/realtime/realtime_translation_session_create_request.rbs +120 -0
  148. data/sig/openai/models/realtime/realtime_translation_session_created_event.rbs +32 -0
  149. data/sig/openai/models/realtime/realtime_translation_session_update_event.rbs +34 -0
  150. data/sig/openai/models/realtime/realtime_translation_session_update_request.rbs +115 -0
  151. data/sig/openai/models/realtime/realtime_translation_session_updated_event.rbs +32 -0
  152. data/sig/openai/models/responses/tool.rbs +15 -5
  153. data/sig/openai/resources/realtime/calls.rbs +2 -0
  154. metadata +56 -5
  155. data/lib/openai/models/realtime/realtime_session_client_secret.rb +0 -36
  156. data/rbi/openai/models/realtime/realtime_session_client_secret.rbi +0 -49
  157. data/sig/openai/models/realtime/realtime_session_client_secret.rbs +0 -20
@@ -19,9 +19,14 @@ module OpenAI
19
19
 
20
20
  # @!attribute background
21
21
  # Allows to set transparency for the background of the generated image(s). This
22
- # parameter is only supported for the GPT image models. Must be one of
23
- # `transparent`, `opaque` or `auto` (default value). When `auto` is used, the
24
- # model will automatically determine the best background for the image.
22
+ # parameter is only supported for GPT image models that support transparent
23
+ # backgrounds. Must be one of `transparent`, `opaque`, or `auto` (default value).
24
+ # When `auto` is used, the model will automatically determine the best background
25
+ # for the image.
26
+ #
27
+ # `gpt-image-2` and `gpt-image-2-2026-04-21` do not support transparent
28
+ # backgrounds. Requests with `background` set to `transparent` will return an
29
+ # error for these models; use `opaque` or `auto` instead.
25
30
  #
26
31
  # If `transparent`, the output format needs to support transparency, so it should
27
32
  # be set to either `png` (default value) or `webp`.
@@ -31,8 +36,9 @@ module OpenAI
31
36
 
32
37
  # @!attribute model
33
38
  # The model to use for image generation. One of `dall-e-2`, `dall-e-3`, or a GPT
34
- # image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`). Defaults to
35
- # `dall-e-2` unless a parameter specific to the GPT image models is used.
39
+ # image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`, `gpt-image-2`,
40
+ # or `gpt-image-2-2026-04-21`). Defaults to `dall-e-2` unless a parameter specific
41
+ # to the GPT image models is used.
36
42
  #
37
43
  # @return [String, Symbol, OpenAI::Models::ImageModel, nil]
38
44
  optional :model, union: -> { OpenAI::ImageGenerateParams::Model }, nil?: true
@@ -100,13 +106,20 @@ module OpenAI
100
106
  optional :response_format, enum: -> { OpenAI::ImageGenerateParams::ResponseFormat }, nil?: true
101
107
 
102
108
  # @!attribute size
103
- # The size of the generated images. Must be one of `1024x1024`, `1536x1024`
104
- # (landscape), `1024x1536` (portrait), or `auto` (default value) for the GPT image
105
- # models, one of `256x256`, `512x512`, or `1024x1024` for `dall-e-2`, and one of
106
- # `1024x1024`, `1792x1024`, or `1024x1792` for `dall-e-3`.
107
- #
108
- # @return [Symbol, OpenAI::Models::ImageGenerateParams::Size, nil]
109
- optional :size, enum: -> { OpenAI::ImageGenerateParams::Size }, nil?: true
109
+ # The size of the generated images. For `gpt-image-2` and
110
+ # `gpt-image-2-2026-04-21`, arbitrary resolutions are supported as `WIDTHxHEIGHT`
111
+ # strings, for example `1536x864`. Width and height must both be divisible by 16
112
+ # and the requested aspect ratio must be between 1:3 and 3:1. Resolutions above
113
+ # `2560x1440` are experimental, and the maximum supported resolution is
114
+ # `3840x2160`. The requested size must also satisfy the model's current pixel and
115
+ # edge limits. The standard sizes `1024x1024`, `1536x1024`, and `1024x1536` are
116
+ # supported by the GPT image models; `auto` is supported for models that allow
117
+ # automatic sizing. For `dall-e-2`, use one of `256x256`, `512x512`, or
118
+ # `1024x1024`. For `dall-e-3`, use one of `1024x1024`, `1792x1024`, or
119
+ # `1024x1792`.
120
+ #
121
+ # @return [String, Symbol, OpenAI::Models::ImageGenerateParams::Size, nil]
122
+ optional :size, union: -> { OpenAI::ImageGenerateParams::Size }, nil?: true
110
123
 
111
124
  # @!attribute style
112
125
  # The style of the generated images. This parameter is only supported for
@@ -149,7 +162,7 @@ module OpenAI
149
162
  #
150
163
  # @param response_format [Symbol, OpenAI::Models::ImageGenerateParams::ResponseFormat, nil] The format in which generated images with `dall-e-2` and `dall-e-3` are returned
151
164
  #
152
- # @param size [Symbol, OpenAI::Models::ImageGenerateParams::Size, nil] The size of the generated images. Must be one of `1024x1024`, `1536x1024` (lands
165
+ # @param size [String, Symbol, OpenAI::Models::ImageGenerateParams::Size, nil] The size of the generated images. For `gpt-image-2` and `gpt-image-2-2026-04-21`
153
166
  #
154
167
  # @param style [Symbol, OpenAI::Models::ImageGenerateParams::Style, nil] The style of the generated images. This parameter is only supported for `dall-e-
155
168
  #
@@ -158,9 +171,14 @@ module OpenAI
158
171
  # @param request_options [OpenAI::RequestOptions, Hash{Symbol=>Object}]
159
172
 
160
173
  # Allows to set transparency for the background of the generated image(s). This
161
- # parameter is only supported for the GPT image models. Must be one of
162
- # `transparent`, `opaque` or `auto` (default value). When `auto` is used, the
163
- # model will automatically determine the best background for the image.
174
+ # parameter is only supported for GPT image models that support transparent
175
+ # backgrounds. Must be one of `transparent`, `opaque`, or `auto` (default value).
176
+ # When `auto` is used, the model will automatically determine the best background
177
+ # for the image.
178
+ #
179
+ # `gpt-image-2` and `gpt-image-2-2026-04-21` do not support transparent
180
+ # backgrounds. Requests with `background` set to `transparent` will return an
181
+ # error for these models; use `opaque` or `auto` instead.
164
182
  #
165
183
  # If `transparent`, the output format needs to support transparency, so it should
166
184
  # be set to either `png` (default value) or `webp`.
@@ -176,14 +194,15 @@ module OpenAI
176
194
  end
177
195
 
178
196
  # The model to use for image generation. One of `dall-e-2`, `dall-e-3`, or a GPT
179
- # image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`). Defaults to
180
- # `dall-e-2` unless a parameter specific to the GPT image models is used.
197
+ # image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`, `gpt-image-2`,
198
+ # or `gpt-image-2-2026-04-21`). Defaults to `dall-e-2` unless a parameter specific
199
+ # to the GPT image models is used.
181
200
  module Model
182
201
  extend OpenAI::Internal::Type::Union
183
202
 
184
203
  variant String
185
204
 
186
- # The model to use for image generation. One of `dall-e-2`, `dall-e-3`, or a GPT image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`). Defaults to `dall-e-2` unless a parameter specific to the GPT image models is used.
205
+ # The model to use for image generation. One of `dall-e-2`, `dall-e-3`, or a GPT image model (`gpt-image-1`, `gpt-image-1-mini`, `gpt-image-1.5`, `gpt-image-2`, or `gpt-image-2-2026-04-21`). Defaults to `dall-e-2` unless a parameter specific to the GPT image models is used.
187
206
  variant enum: -> { OpenAI::ImageModel }
188
207
 
189
208
  # @!method self.variants
@@ -251,12 +270,46 @@ module OpenAI
251
270
  # @return [Array<Symbol>]
252
271
  end
253
272
 
254
- # The size of the generated images. Must be one of `1024x1024`, `1536x1024`
255
- # (landscape), `1024x1536` (portrait), or `auto` (default value) for the GPT image
256
- # models, one of `256x256`, `512x512`, or `1024x1024` for `dall-e-2`, and one of
257
- # `1024x1024`, `1792x1024`, or `1024x1792` for `dall-e-3`.
273
+ # The size of the generated images. For `gpt-image-2` and
274
+ # `gpt-image-2-2026-04-21`, arbitrary resolutions are supported as `WIDTHxHEIGHT`
275
+ # strings, for example `1536x864`. Width and height must both be divisible by 16
276
+ # and the requested aspect ratio must be between 1:3 and 3:1. Resolutions above
277
+ # `2560x1440` are experimental, and the maximum supported resolution is
278
+ # `3840x2160`. The requested size must also satisfy the model's current pixel and
279
+ # edge limits. The standard sizes `1024x1024`, `1536x1024`, and `1024x1536` are
280
+ # supported by the GPT image models; `auto` is supported for models that allow
281
+ # automatic sizing. For `dall-e-2`, use one of `256x256`, `512x512`, or
282
+ # `1024x1024`. For `dall-e-3`, use one of `1024x1024`, `1792x1024`, or
283
+ # `1024x1792`.
258
284
  module Size
259
- extend OpenAI::Internal::Type::Enum
285
+ extend OpenAI::Internal::Type::Union
286
+
287
+ variant String
288
+
289
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::AUTO }
290
+
291
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_1024X1024 }
292
+
293
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_1536X1024 }
294
+
295
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_1024X1536 }
296
+
297
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_256X256 }
298
+
299
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_512X512 }
300
+
301
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_1792X1024 }
302
+
303
+ variant const: -> { OpenAI::Models::ImageGenerateParams::Size::SIZE_1024X1792 }
304
+
305
+ # @!method self.variants
306
+ # @return [Array(String, Symbol)]
307
+
308
+ define_sorbet_constant!(:Variants) do
309
+ T.type_alias { T.any(String, OpenAI::ImageGenerateParams::Size::TaggedSymbol) }
310
+ end
311
+
312
+ # @!group
260
313
 
261
314
  AUTO = :auto
262
315
  SIZE_1024X1024 = :"1024x1024"
@@ -267,8 +320,7 @@ module OpenAI
267
320
  SIZE_1792X1024 = :"1792x1024"
268
321
  SIZE_1024X1792 = :"1024x1792"
269
322
 
270
- # @!method self.values
271
- # @return [Array<Symbol>]
323
+ # @!endgroup
272
324
  end
273
325
 
274
326
  # The style of the generated images. This parameter is only supported for
@@ -5,11 +5,14 @@ module OpenAI
5
5
  module ImageModel
6
6
  extend OpenAI::Internal::Type::Enum
7
7
 
8
+ GPT_IMAGE_1 = :"gpt-image-1"
9
+ GPT_IMAGE_1_MINI = :"gpt-image-1-mini"
10
+ GPT_IMAGE_2 = :"gpt-image-2"
11
+ GPT_IMAGE_2_2026_04_21 = :"gpt-image-2-2026-04-21"
8
12
  GPT_IMAGE_1_5 = :"gpt-image-1.5"
13
+ CHATGPT_IMAGE_LATEST = :"chatgpt-image-latest"
9
14
  DALL_E_2 = :"dall-e-2"
10
15
  DALL_E_3 = :"dall-e-3"
11
- GPT_IMAGE_1 = :"gpt-image-1"
12
- GPT_IMAGE_1_MINI = :"gpt-image-1-mini"
13
16
 
14
17
  # @!method self.values
15
18
  # @return [Array<Symbol>]
@@ -4,6 +4,14 @@ module OpenAI
4
4
  module Models
5
5
  module Realtime
6
6
  class AudioTranscription < OpenAI::Internal::Type::BaseModel
7
+ # @!attribute delay
8
+ # Controls how long the model waits before emitting transcription text. Higher
9
+ # values can improve transcription accuracy at the cost of latency. Only supported
10
+ # with `gpt-realtime-whisper` in GA Realtime sessions.
11
+ #
12
+ # @return [Symbol, OpenAI::Models::Realtime::AudioTranscription::Delay, nil]
13
+ optional :delay, enum: -> { OpenAI::Realtime::AudioTranscription::Delay }
14
+
7
15
  # @!attribute language
8
16
  # The language of the input audio. Supplying the input language in
9
17
  # [ISO-639-1](https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes) (e.g. `en`)
@@ -15,8 +23,8 @@ module OpenAI
15
23
  # @!attribute model
16
24
  # The model to use for transcription. Current options are `whisper-1`,
17
25
  # `gpt-4o-mini-transcribe`, `gpt-4o-mini-transcribe-2025-12-15`,
18
- # `gpt-4o-transcribe`, and `gpt-4o-transcribe-diarize`. Use
19
- # `gpt-4o-transcribe-diarize` when you need diarization with speaker labels.
26
+ # `gpt-4o-transcribe`, `gpt-4o-transcribe-diarize`, and `gpt-realtime-whisper`.
27
+ # Use `gpt-4o-transcribe-diarize` when you need diarization with speaker labels.
20
28
  #
21
29
  # @return [String, Symbol, OpenAI::Models::Realtime::AudioTranscription::Model, nil]
22
30
  optional :model, union: -> { OpenAI::Realtime::AudioTranscription::Model }
@@ -27,24 +35,45 @@ module OpenAI
27
35
  # [prompt is a list of keywords](https://platform.openai.com/docs/guides/speech-to-text#prompting).
28
36
  # For `gpt-4o-transcribe` models (excluding `gpt-4o-transcribe-diarize`), the
29
37
  # prompt is a free text string, for example "expect words related to technology".
38
+ # Prompt is not supported with `gpt-realtime-whisper` in GA Realtime sessions.
30
39
  #
31
40
  # @return [String, nil]
32
41
  optional :prompt, String
33
42
 
34
- # @!method initialize(language: nil, model: nil, prompt: nil)
43
+ # @!method initialize(delay: nil, language: nil, model: nil, prompt: nil)
35
44
  # Some parameter documentations has been truncated, see
36
45
  # {OpenAI::Models::Realtime::AudioTranscription} for more details.
37
46
  #
47
+ # @param delay [Symbol, OpenAI::Models::Realtime::AudioTranscription::Delay] Controls how long the model waits before emitting transcription text.
48
+ #
38
49
  # @param language [String] The language of the input audio. Supplying the input language in
39
50
  #
40
51
  # @param model [String, Symbol, OpenAI::Models::Realtime::AudioTranscription::Model] The model to use for transcription. Current options are `whisper-1`, `gpt-4o-min
41
52
  #
42
53
  # @param prompt [String] An optional text to guide the model's style or continue a previous audio
43
54
 
55
+ # Controls how long the model waits before emitting transcription text. Higher
56
+ # values can improve transcription accuracy at the cost of latency. Only supported
57
+ # with `gpt-realtime-whisper` in GA Realtime sessions.
58
+ #
59
+ # @see OpenAI::Models::Realtime::AudioTranscription#delay
60
+ module Delay
61
+ extend OpenAI::Internal::Type::Enum
62
+
63
+ MINIMAL = :minimal
64
+ LOW = :low
65
+ MEDIUM = :medium
66
+ HIGH = :high
67
+ XHIGH = :xhigh
68
+
69
+ # @!method self.values
70
+ # @return [Array<Symbol>]
71
+ end
72
+
44
73
  # The model to use for transcription. Current options are `whisper-1`,
45
74
  # `gpt-4o-mini-transcribe`, `gpt-4o-mini-transcribe-2025-12-15`,
46
- # `gpt-4o-transcribe`, and `gpt-4o-transcribe-diarize`. Use
47
- # `gpt-4o-transcribe-diarize` when you need diarization with speaker labels.
75
+ # `gpt-4o-transcribe`, `gpt-4o-transcribe-diarize`, and `gpt-realtime-whisper`.
76
+ # Use `gpt-4o-transcribe-diarize` when you need diarization with speaker labels.
48
77
  #
49
78
  # @see OpenAI::Models::Realtime::AudioTranscription#model
50
79
  module Model
@@ -62,6 +91,8 @@ module OpenAI
62
91
 
63
92
  variant const: -> { OpenAI::Models::Realtime::AudioTranscription::Model::GPT_4O_TRANSCRIBE_DIARIZE }
64
93
 
94
+ variant const: -> { OpenAI::Models::Realtime::AudioTranscription::Model::GPT_REALTIME_WHISPER }
95
+
65
96
  # @!method self.variants
66
97
  # @return [Array(String, Symbol)]
67
98
 
@@ -76,6 +107,7 @@ module OpenAI
76
107
  GPT_4O_MINI_TRANSCRIBE_2025_12_15 = :"gpt-4o-mini-transcribe-2025-12-15"
77
108
  GPT_4O_TRANSCRIBE = :"gpt-4o-transcribe"
78
109
  GPT_4O_TRANSCRIBE_DIARIZE = :"gpt-4o-transcribe-diarize"
110
+ GPT_REALTIME_WHISPER = :"gpt-realtime-whisper"
79
111
 
80
112
  # @!endgroup
81
113
  end
@@ -43,8 +43,7 @@ module OpenAI
43
43
 
44
44
  discriminator :type
45
45
 
46
- # A new Realtime session configuration, with an ephemeral key. Default TTL
47
- # for keys is one minute.
46
+ # A Realtime session configuration object.
48
47
  variant :realtime, -> { OpenAI::Realtime::RealtimeSessionCreateResponse }
49
48
 
50
49
  # A Realtime transcription session configuration object.
@@ -48,6 +48,9 @@ module OpenAI
48
48
  # wait longer for the user to continue speaking. This can be useful for more
49
49
  # natural conversations, but may have a higher latency.
50
50
  #
51
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
52
+ # `null`; VAD is not supported.
53
+ #
51
54
  # @return [OpenAI::Models::Realtime::RealtimeAudioInputTurnDetection::ServerVad, OpenAI::Models::Realtime::RealtimeAudioInputTurnDetection::SemanticVad, nil]
52
55
  optional :turn_detection, union: -> { OpenAI::Realtime::RealtimeAudioInputTurnDetection }, nil?: true
53
56
 
@@ -16,6 +16,9 @@ module OpenAI
16
16
  # trails off with "uhhm", the model will score a low probability of turn end and
17
17
  # wait longer for the user to continue speaking. This can be useful for more
18
18
  # natural conversations, but may have a higher latency.
19
+ #
20
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
21
+ # `null`; VAD is not supported.
19
22
  module RealtimeAudioInputTurnDetection
20
23
  extend OpenAI::Internal::Type::Union
21
24
 
@@ -0,0 +1,24 @@
1
+ # frozen_string_literal: true
2
+
3
+ module OpenAI
4
+ module Models
5
+ module Realtime
6
+ class RealtimeReasoning < OpenAI::Internal::Type::BaseModel
7
+ # @!attribute effort
8
+ # Constrains effort on reasoning for reasoning-capable Realtime models such as
9
+ # `gpt-realtime-2`.
10
+ #
11
+ # @return [Symbol, OpenAI::Models::Realtime::RealtimeReasoningEffort, nil]
12
+ optional :effort, enum: -> { OpenAI::Realtime::RealtimeReasoningEffort }
13
+
14
+ # @!method initialize(effort: nil)
15
+ # Some parameter documentations has been truncated, see
16
+ # {OpenAI::Models::Realtime::RealtimeReasoning} for more details.
17
+ #
18
+ # Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
19
+ #
20
+ # @param effort [Symbol, OpenAI::Models::Realtime::RealtimeReasoningEffort] Constrains effort on reasoning for reasoning-capable Realtime models such as
21
+ end
22
+ end
23
+ end
24
+ end
@@ -0,0 +1,22 @@
1
+ # frozen_string_literal: true
2
+
3
+ module OpenAI
4
+ module Models
5
+ module Realtime
6
+ # Constrains effort on reasoning for reasoning-capable Realtime models such as
7
+ # `gpt-realtime-2`.
8
+ module RealtimeReasoningEffort
9
+ extend OpenAI::Internal::Type::Enum
10
+
11
+ MINIMAL = :minimal
12
+ LOW = :low
13
+ MEDIUM = :medium
14
+ HIGH = :high
15
+ XHIGH = :xhigh
16
+
17
+ # @!method self.values
18
+ # @return [Array<Symbol>]
19
+ end
20
+ end
21
+ end
22
+ end
@@ -73,6 +73,13 @@ module OpenAI
73
73
  optional :output_modalities,
74
74
  -> { OpenAI::Internal::Type::ArrayOf[enum: OpenAI::Realtime::RealtimeResponseCreateParams::OutputModality] }
75
75
 
76
+ # @!attribute parallel_tool_calls
77
+ # Whether the model may call multiple tools in parallel. Only supported by
78
+ # reasoning Realtime models such as `gpt-realtime-2`.
79
+ #
80
+ # @return [Boolean, nil]
81
+ optional :parallel_tool_calls, OpenAI::Internal::Type::Boolean
82
+
76
83
  # @!attribute prompt
77
84
  # Reference to a prompt template and its variables.
78
85
  # [Learn more](https://platform.openai.com/docs/guides/text?api-mode=responses#reusable-prompts).
@@ -80,6 +87,12 @@ module OpenAI
80
87
  # @return [OpenAI::Models::Responses::ResponsePrompt, nil]
81
88
  optional :prompt, -> { OpenAI::Responses::ResponsePrompt }, nil?: true
82
89
 
90
+ # @!attribute reasoning
91
+ # Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
92
+ #
93
+ # @return [OpenAI::Models::Realtime::RealtimeReasoning, nil]
94
+ optional :reasoning, -> { OpenAI::Realtime::RealtimeReasoning }
95
+
83
96
  # @!attribute tool_choice
84
97
  # How the model chooses tools. Provide one of the string modes or force a specific
85
98
  # function/MCP tool.
@@ -94,7 +107,7 @@ module OpenAI
94
107
  optional :tools,
95
108
  -> { OpenAI::Internal::Type::ArrayOf[union: OpenAI::Realtime::RealtimeResponseCreateParams::Tool] }
96
109
 
97
- # @!method initialize(audio: nil, conversation: nil, input: nil, instructions: nil, max_output_tokens: nil, metadata: nil, output_modalities: nil, prompt: nil, tool_choice: nil, tools: nil)
110
+ # @!method initialize(audio: nil, conversation: nil, input: nil, instructions: nil, max_output_tokens: nil, metadata: nil, output_modalities: nil, parallel_tool_calls: nil, prompt: nil, reasoning: nil, tool_choice: nil, tools: nil)
98
111
  # Some parameter documentations has been truncated, see
99
112
  # {OpenAI::Models::Realtime::RealtimeResponseCreateParams} for more details.
100
113
  #
@@ -114,8 +127,12 @@ module OpenAI
114
127
  #
115
128
  # @param output_modalities [Array<Symbol, OpenAI::Models::Realtime::RealtimeResponseCreateParams::OutputModality>] The set of modalities the model used to respond, currently the only possible val
116
129
  #
130
+ # @param parallel_tool_calls [Boolean] Whether the model may call multiple tools in parallel. Only supported by
131
+ #
117
132
  # @param prompt [OpenAI::Models::Responses::ResponsePrompt, nil] Reference to a prompt template and its variables.
118
133
  #
134
+ # @param reasoning [OpenAI::Models::Realtime::RealtimeReasoning] Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
135
+ #
119
136
  # @param tool_choice [Symbol, OpenAI::Models::Responses::ToolChoiceOptions, OpenAI::Models::Responses::ToolChoiceFunction, OpenAI::Models::Responses::ToolChoiceMcp] How the model chooses tools. Provide one of the string modes or force a specific
120
137
  #
121
138
  # @param tools [Array<OpenAI::Models::Realtime::RealtimeFunctionTool, OpenAI::Models::Realtime::RealtimeResponseCreateMcpTool>] Tools available to the model.
@@ -170,6 +170,9 @@ module OpenAI
170
170
  # wait longer for the user to continue speaking. This can be useful for more
171
171
  # natural conversations, but may have a higher latency.
172
172
  #
173
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
174
+ # `null`; VAD is not supported.
175
+ #
173
176
  # @return [OpenAI::Models::Realtime::RealtimeSession::TurnDetection::ServerVad, OpenAI::Models::Realtime::RealtimeSession::TurnDetection::SemanticVad, nil]
174
177
  optional :turn_detection, union: -> { OpenAI::Realtime::RealtimeSession::TurnDetection }, nil?: true
175
178
 
@@ -468,6 +471,9 @@ module OpenAI
468
471
  # wait longer for the user to continue speaking. This can be useful for more
469
472
  # natural conversations, but may have a higher latency.
470
473
  #
474
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
475
+ # `null`; VAD is not supported.
476
+ #
471
477
  # @see OpenAI::Models::Realtime::RealtimeSession#turn_detection
472
478
  module TurnDetection
473
479
  extend OpenAI::Internal::Type::Union
@@ -66,6 +66,13 @@ module OpenAI
66
66
  optional :output_modalities,
67
67
  -> { OpenAI::Internal::Type::ArrayOf[enum: OpenAI::Realtime::RealtimeSessionCreateRequest::OutputModality] }
68
68
 
69
+ # @!attribute parallel_tool_calls
70
+ # Whether the model may call multiple tools in parallel. Only supported by
71
+ # reasoning Realtime models such as `gpt-realtime-2`.
72
+ #
73
+ # @return [Boolean, nil]
74
+ optional :parallel_tool_calls, OpenAI::Internal::Type::Boolean
75
+
69
76
  # @!attribute prompt
70
77
  # Reference to a prompt template and its variables.
71
78
  # [Learn more](https://platform.openai.com/docs/guides/text?api-mode=responses#reusable-prompts).
@@ -73,6 +80,12 @@ module OpenAI
73
80
  # @return [OpenAI::Models::Responses::ResponsePrompt, nil]
74
81
  optional :prompt, -> { OpenAI::Responses::ResponsePrompt }, nil?: true
75
82
 
83
+ # @!attribute reasoning
84
+ # Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
85
+ #
86
+ # @return [OpenAI::Models::Realtime::RealtimeReasoning, nil]
87
+ optional :reasoning, -> { OpenAI::Realtime::RealtimeReasoning }
88
+
76
89
  # @!attribute tool_choice
77
90
  # How the model chooses tools. Provide one of the string modes or force a specific
78
91
  # function/MCP tool.
@@ -121,7 +134,7 @@ module OpenAI
121
134
  # @return [Symbol, OpenAI::Models::Realtime::RealtimeTruncation::RealtimeTruncationStrategy, OpenAI::Models::Realtime::RealtimeTruncationRetentionRatio, nil]
122
135
  optional :truncation, union: -> { OpenAI::Realtime::RealtimeTruncation }
123
136
 
124
- # @!method initialize(audio: nil, include: nil, instructions: nil, max_output_tokens: nil, model: nil, output_modalities: nil, prompt: nil, tool_choice: nil, tools: nil, tracing: nil, truncation: nil, type: :realtime)
137
+ # @!method initialize(audio: nil, include: nil, instructions: nil, max_output_tokens: nil, model: nil, output_modalities: nil, parallel_tool_calls: nil, prompt: nil, reasoning: nil, tool_choice: nil, tools: nil, tracing: nil, truncation: nil, type: :realtime)
125
138
  # Some parameter documentation has been truncated, see
126
139
  # {OpenAI::Models::Realtime::RealtimeSessionCreateRequest} for more details.
127
140
  #
@@ -139,8 +152,12 @@ module OpenAI
139
152
  #
140
153
  # @param output_modalities [Array<Symbol, OpenAI::Models::Realtime::RealtimeSessionCreateRequest::OutputModality>] The set of modalities the model can respond with. It defaults to `["audio"]`, in
141
154
  #
155
+ # @param parallel_tool_calls [Boolean] Whether the model may call multiple tools in parallel. Only supported by
156
+ #
142
157
  # @param prompt [OpenAI::Models::Responses::ResponsePrompt, nil] Reference to a prompt template and its variables.
143
158
  #
159
+ # @param reasoning [OpenAI::Models::Realtime::RealtimeReasoning] Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
160
+ #
144
161
  # @param tool_choice [Symbol, OpenAI::Models::Responses::ToolChoiceOptions, OpenAI::Models::Responses::ToolChoiceFunction, OpenAI::Models::Responses::ToolChoiceMcp] How the model chooses tools. Provide one of the string modes or force a specific
145
162
  #
146
163
  # @param tools [Array<OpenAI::Models::Realtime::RealtimeFunctionTool, OpenAI::Models::Realtime::RealtimeToolsConfigUnion::Mcp>] Tools available to the model.
@@ -188,6 +205,8 @@ module OpenAI
188
205
 
189
206
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateRequest::Model::GPT_REALTIME_1_5 }
190
207
 
208
+ variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateRequest::Model::GPT_REALTIME_2 }
209
+
191
210
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateRequest::Model::GPT_REALTIME_2025_08_28 }
192
211
 
193
212
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateRequest::Model::GPT_4O_REALTIME_PREVIEW }
@@ -227,6 +246,7 @@ module OpenAI
227
246
 
228
247
  GPT_REALTIME = :"gpt-realtime"
229
248
  GPT_REALTIME_1_5 = :"gpt-realtime-1.5"
249
+ GPT_REALTIME_2 = :"gpt-realtime-2"
230
250
  GPT_REALTIME_2025_08_28 = :"gpt-realtime-2025-08-28"
231
251
  GPT_4O_REALTIME_PREVIEW = :"gpt-4o-realtime-preview"
232
252
  GPT_4O_REALTIME_PREVIEW_2024_10_01 = :"gpt-4o-realtime-preview-2024-10-01"
@@ -4,11 +4,17 @@ module OpenAI
4
4
  module Models
5
5
  module Realtime
6
6
  class RealtimeSessionCreateResponse < OpenAI::Internal::Type::BaseModel
7
- # @!attribute client_secret
8
- # Ephemeral key returned by the API.
7
+ # @!attribute id
8
+ # Unique identifier for the session that looks like `sess_1234567890abcdef`.
9
9
  #
10
- # @return [OpenAI::Models::Realtime::RealtimeSessionClientSecret]
11
- required :client_secret, -> { OpenAI::Realtime::RealtimeSessionClientSecret }
10
+ # @return [String]
11
+ required :id, String
12
+
13
+ # @!attribute object
14
+ # The object type. Always `realtime.session`.
15
+ #
16
+ # @return [Symbol, :"realtime.session"]
17
+ required :object, const: :"realtime.session"
12
18
 
13
19
  # @!attribute type
14
20
  # The type of session to create. Always `realtime` for the Realtime API.
@@ -22,6 +28,12 @@ module OpenAI
22
28
  # @return [OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio, nil]
23
29
  optional :audio, -> { OpenAI::Realtime::RealtimeSessionCreateResponse::Audio }
24
30
 
31
+ # @!attribute expires_at
32
+ # Expiration timestamp for the session, in seconds since epoch.
33
+ #
34
+ # @return [Integer, nil]
35
+ optional :expires_at, Integer
36
+
25
37
  # @!attribute include
26
38
  # Additional fields to include in server outputs.
27
39
  #
@@ -80,6 +92,12 @@ module OpenAI
80
92
  # @return [OpenAI::Models::Responses::ResponsePrompt, nil]
81
93
  optional :prompt, -> { OpenAI::Responses::ResponsePrompt }, nil?: true
82
94
 
95
+ # @!attribute reasoning
96
+ # Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
97
+ #
98
+ # @return [OpenAI::Models::Realtime::RealtimeReasoning, nil]
99
+ optional :reasoning, -> { OpenAI::Realtime::RealtimeReasoning }
100
+
83
101
  # @!attribute tool_choice
84
102
  # How the model chooses tools. Provide one of the string modes or force a specific
85
103
  # function/MCP tool.
@@ -129,17 +147,18 @@ module OpenAI
129
147
  # @return [Symbol, OpenAI::Models::Realtime::RealtimeTruncation::RealtimeTruncationStrategy, OpenAI::Models::Realtime::RealtimeTruncationRetentionRatio, nil]
130
148
  optional :truncation, union: -> { OpenAI::Realtime::RealtimeTruncation }
131
149
 
132
- # @!method initialize(client_secret:, audio: nil, include: nil, instructions: nil, max_output_tokens: nil, model: nil, output_modalities: nil, prompt: nil, tool_choice: nil, tools: nil, tracing: nil, truncation: nil, type: :realtime)
150
+ # @!method initialize(id:, audio: nil, expires_at: nil, include: nil, instructions: nil, max_output_tokens: nil, model: nil, output_modalities: nil, prompt: nil, reasoning: nil, tool_choice: nil, tools: nil, tracing: nil, truncation: nil, object: :"realtime.session", type: :realtime)
133
151
  # Some parameter documentation has been truncated, see
134
152
  # {OpenAI::Models::Realtime::RealtimeSessionCreateResponse} for more details.
135
153
  #
136
- # A new Realtime session configuration, with an ephemeral key. Default TTL for
137
- # keys is one minute.
154
+ # A Realtime session configuration object.
138
155
  #
139
- # @param client_secret [OpenAI::Models::Realtime::RealtimeSessionClientSecret] Ephemeral key returned by the API.
156
+ # @param id [String] Unique identifier for the session that looks like `sess_1234567890abcdef`.
140
157
  #
141
158
  # @param audio [OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio] Configuration for input and output audio.
142
159
  #
160
+ # @param expires_at [Integer] Expiration timestamp for the session, in seconds since epoch.
161
+ #
143
162
  # @param include [Array<Symbol, OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Include>] Additional fields to include in server outputs.
144
163
  #
145
164
  # @param instructions [String] The default system instructions (i.e. system message) prepended to model calls.
@@ -152,6 +171,8 @@ module OpenAI
152
171
  #
153
172
  # @param prompt [OpenAI::Models::Responses::ResponsePrompt, nil] Reference to a prompt template and its variables.
154
173
  #
174
+ # @param reasoning [OpenAI::Models::Realtime::RealtimeReasoning] Configuration for reasoning-capable Realtime models such as `gpt-realtime-2`.
175
+ #
155
176
  # @param tool_choice [Symbol, OpenAI::Models::Responses::ToolChoiceOptions, OpenAI::Models::Responses::ToolChoiceFunction, OpenAI::Models::Responses::ToolChoiceMcp] How the model chooses tools. Provide one of the string modes or force a specific
156
177
  #
157
178
  # @param tools [Array<OpenAI::Models::Realtime::RealtimeFunctionTool, OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Tool::McpTool>] Tools available to the model.
@@ -160,6 +181,8 @@ module OpenAI
160
181
  #
161
182
  # @param truncation [Symbol, OpenAI::Models::Realtime::RealtimeTruncation::RealtimeTruncationStrategy, OpenAI::Models::Realtime::RealtimeTruncationRetentionRatio] When the number of tokens in a conversation exceeds the model's input token limi
162
183
  #
184
+ # @param object [Symbol, :"realtime.session"] The object type. Always `realtime.session`.
185
+ #
163
186
  # @param type [Symbol, :realtime] The type of session to create. Always `realtime` for the Realtime API.
164
187
 
165
188
  # @see OpenAI::Models::Realtime::RealtimeSessionCreateResponse#audio
@@ -200,14 +223,6 @@ module OpenAI
200
223
  -> { OpenAI::Realtime::RealtimeSessionCreateResponse::Audio::Input::NoiseReduction }
201
224
 
202
225
  # @!attribute transcription
203
- # Configuration for input audio transcription, defaults to off and can be set to
204
- # `null` to turn off once on. Input audio transcription is not native to the
205
- # model, since the model consumes audio directly. Transcription runs
206
- # asynchronously through
207
- # [the /audio/transcriptions endpoint](https://platform.openai.com/docs/api-reference/audio/createTranscription)
208
- # and should be treated as guidance of input audio content rather than precisely
209
- # what the model heard. The client can optionally set the language and prompt for
210
- # transcription, these offer additional guidance to the transcription service.
211
226
  #
212
227
  # @return [OpenAI::Models::Realtime::AudioTranscription, nil]
213
228
  optional :transcription, -> { OpenAI::Realtime::AudioTranscription }
@@ -227,6 +242,9 @@ module OpenAI
227
242
  # wait longer for the user to continue speaking. This can be useful for more
228
243
  # natural conversations, but may have a higher latency.
229
244
  #
245
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
246
+ # `null`; VAD is not supported.
247
+ #
230
248
  # @return [OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input::TurnDetection::ServerVad, OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input::TurnDetection::SemanticVad, nil]
231
249
  optional :turn_detection,
232
250
  union: -> {
@@ -243,7 +261,7 @@ module OpenAI
243
261
  #
244
262
  # @param noise_reduction [OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input::NoiseReduction] Configuration for input audio noise reduction. This can be set to `null` to turn
245
263
  #
246
- # @param transcription [OpenAI::Models::Realtime::AudioTranscription] Configuration for input audio transcription, defaults to off and can be set to `
264
+ # @param transcription [OpenAI::Models::Realtime::AudioTranscription]
247
265
  #
248
266
  # @param turn_detection [OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input::TurnDetection::ServerVad, OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input::TurnDetection::SemanticVad, nil] Configuration for turn detection, either Server VAD or Semantic VAD. This can be
249
267
 
@@ -285,6 +303,9 @@ module OpenAI
285
303
  # wait longer for the user to continue speaking. This can be useful for more
286
304
  # natural conversations, but may have a higher latency.
287
305
  #
306
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
307
+ # `null`; VAD is not supported.
308
+ #
288
309
  # @see OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Audio::Input#turn_detection
289
310
  module TurnDetection
290
311
  extend OpenAI::Internal::Type::Union
@@ -597,6 +618,8 @@ module OpenAI
597
618
 
598
619
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Model::GPT_REALTIME_1_5 }
599
620
 
621
+ variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Model::GPT_REALTIME_2 }
622
+
600
623
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Model::GPT_REALTIME_2025_08_28 }
601
624
 
602
625
  variant const: -> { OpenAI::Models::Realtime::RealtimeSessionCreateResponse::Model::GPT_4O_REALTIME_PREVIEW }
@@ -636,6 +659,7 @@ module OpenAI
636
659
 
637
660
  GPT_REALTIME = :"gpt-realtime"
638
661
  GPT_REALTIME_1_5 = :"gpt-realtime-1.5"
662
+ GPT_REALTIME_2 = :"gpt-realtime-2"
639
663
  GPT_REALTIME_2025_08_28 = :"gpt-realtime-2025-08-28"
640
664
  GPT_4O_REALTIME_PREVIEW = :"gpt-4o-realtime-preview"
641
665
  GPT_4O_REALTIME_PREVIEW_2024_10_01 = :"gpt-4o-realtime-preview-2024-10-01"
@@ -48,6 +48,9 @@ module OpenAI
48
48
  # wait longer for the user to continue speaking. This can be useful for more
49
49
  # natural conversations, but may have a higher latency.
50
50
  #
51
+ # For `gpt-realtime-whisper` transcription sessions, turn detection must be set to
52
+ # `null`; VAD is not supported.
53
+ #
51
54
  # @return [OpenAI::Models::Realtime::RealtimeTranscriptionSessionAudioInputTurnDetection::ServerVad, OpenAI::Models::Realtime::RealtimeTranscriptionSessionAudioInputTurnDetection::SemanticVad, nil]
52
55
  optional :turn_detection,
53
56
  union: -> { OpenAI::Realtime::RealtimeTranscriptionSessionAudioInputTurnDetection },