openai 0.22.1 → 0.23.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (158)
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +8 -0
  3. data/README.md +1 -1
  4. data/lib/openai/models/realtime/audio_transcription.rb +60 -0
  5. data/lib/openai/models/realtime/client_secret_create_params.rb +18 -9
  6. data/lib/openai/models/realtime/client_secret_create_response.rb +11 -250
  7. data/lib/openai/models/realtime/conversation_item.rb +1 -1
  8. data/lib/openai/models/realtime/conversation_item_added.rb +14 -1
  9. data/lib/openai/models/realtime/conversation_item_done.rb +3 -0
  10. data/lib/openai/models/realtime/conversation_item_input_audio_transcription_completed_event.rb +10 -8
  11. data/lib/openai/models/realtime/conversation_item_input_audio_transcription_delta_event.rb +14 -5
  12. data/lib/openai/models/realtime/conversation_item_truncate_event.rb +2 -2
  13. data/lib/openai/models/realtime/input_audio_buffer_append_event.rb +10 -5
  14. data/lib/openai/models/realtime/models.rb +58 -0
  15. data/lib/openai/models/realtime/noise_reduction_type.rb +20 -0
  16. data/lib/openai/models/realtime/realtime_audio_config.rb +6 -427
  17. data/lib/openai/models/realtime/realtime_audio_config_input.rb +89 -0
  18. data/lib/openai/models/realtime/realtime_audio_config_output.rb +100 -0
  19. data/lib/openai/models/realtime/realtime_audio_formats.rb +121 -0
  20. data/lib/openai/models/realtime/realtime_audio_input_turn_detection.rb +131 -0
  21. data/lib/openai/models/realtime/realtime_client_event.rb +31 -23
  22. data/lib/openai/models/realtime/realtime_conversation_item_assistant_message.rb +43 -10
  23. data/lib/openai/models/realtime/realtime_conversation_item_function_call.rb +16 -7
  24. data/lib/openai/models/realtime/realtime_conversation_item_function_call_output.rb +15 -7
  25. data/lib/openai/models/realtime/realtime_conversation_item_system_message.rb +18 -6
  26. data/lib/openai/models/realtime/realtime_conversation_item_user_message.rb +62 -13
  27. data/lib/openai/models/realtime/realtime_response.rb +117 -107
  28. data/lib/openai/models/realtime/realtime_response_create_audio_output.rb +100 -0
  29. data/lib/openai/models/realtime/realtime_response_create_mcp_tool.rb +310 -0
  30. data/lib/openai/models/realtime/realtime_response_create_params.rb +225 -0
  31. data/lib/openai/models/realtime/realtime_response_status.rb +1 -1
  32. data/lib/openai/models/realtime/realtime_response_usage.rb +5 -2
  33. data/lib/openai/models/realtime/realtime_response_usage_input_token_details.rb +58 -8
  34. data/lib/openai/models/realtime/realtime_server_event.rb +21 -5
  35. data/lib/openai/models/realtime/realtime_session.rb +9 -125
  36. data/lib/openai/models/realtime/realtime_session_client_secret.rb +36 -0
  37. data/lib/openai/models/realtime/realtime_session_create_request.rb +50 -71
  38. data/lib/openai/models/realtime/realtime_session_create_response.rb +621 -219
  39. data/lib/openai/models/realtime/realtime_tools_config_union.rb +2 -53
  40. data/lib/openai/models/realtime/realtime_tracing_config.rb +7 -6
  41. data/lib/openai/models/realtime/realtime_transcription_session_audio.rb +19 -0
  42. data/lib/openai/models/realtime/realtime_transcription_session_audio_input.rb +90 -0
  43. data/lib/openai/models/realtime/realtime_transcription_session_audio_input_turn_detection.rb +131 -0
  44. data/lib/openai/models/realtime/realtime_transcription_session_client_secret.rb +38 -0
  45. data/lib/openai/models/realtime/realtime_transcription_session_create_request.rb +12 -270
  46. data/lib/openai/models/realtime/realtime_transcription_session_create_response.rb +78 -0
  47. data/lib/openai/models/realtime/realtime_transcription_session_input_audio_transcription.rb +66 -0
  48. data/lib/openai/models/realtime/realtime_transcription_session_turn_detection.rb +57 -0
  49. data/lib/openai/models/realtime/realtime_truncation.rb +8 -40
  50. data/lib/openai/models/realtime/realtime_truncation_retention_ratio.rb +34 -0
  51. data/lib/openai/models/realtime/response_cancel_event.rb +3 -1
  52. data/lib/openai/models/realtime/response_create_event.rb +18 -348
  53. data/lib/openai/models/realtime/response_done_event.rb +7 -0
  54. data/lib/openai/models/realtime/session_created_event.rb +20 -4
  55. data/lib/openai/models/realtime/session_update_event.rb +36 -12
  56. data/lib/openai/models/realtime/session_updated_event.rb +20 -4
  57. data/lib/openai/models/realtime/transcription_session_created.rb +8 -243
  58. data/lib/openai/models/realtime/transcription_session_update.rb +179 -3
  59. data/lib/openai/models/realtime/transcription_session_updated_event.rb +8 -243
  60. data/lib/openai/resources/realtime/client_secrets.rb +2 -3
  61. data/lib/openai/version.rb +1 -1
  62. data/lib/openai.rb +19 -1
  63. data/rbi/openai/models/realtime/audio_transcription.rbi +132 -0
  64. data/rbi/openai/models/realtime/client_secret_create_params.rbi +25 -11
  65. data/rbi/openai/models/realtime/client_secret_create_response.rbi +2 -587
  66. data/rbi/openai/models/realtime/conversation_item_added.rbi +14 -1
  67. data/rbi/openai/models/realtime/conversation_item_done.rbi +3 -0
  68. data/rbi/openai/models/realtime/conversation_item_input_audio_transcription_completed_event.rbi +11 -8
  69. data/rbi/openai/models/realtime/conversation_item_input_audio_transcription_delta_event.rbi +15 -5
  70. data/rbi/openai/models/realtime/conversation_item_truncate_event.rbi +2 -2
  71. data/rbi/openai/models/realtime/input_audio_buffer_append_event.rbi +10 -5
  72. data/rbi/openai/models/realtime/models.rbi +97 -0
  73. data/rbi/openai/models/realtime/noise_reduction_type.rbi +31 -0
  74. data/rbi/openai/models/realtime/realtime_audio_config.rbi +8 -956
  75. data/rbi/openai/models/realtime/realtime_audio_config_input.rbi +221 -0
  76. data/rbi/openai/models/realtime/realtime_audio_config_output.rbi +222 -0
  77. data/rbi/openai/models/realtime/realtime_audio_formats.rbi +329 -0
  78. data/rbi/openai/models/realtime/realtime_audio_input_turn_detection.rbi +262 -0
  79. data/rbi/openai/models/realtime/realtime_conversation_item_assistant_message.rbi +51 -10
  80. data/rbi/openai/models/realtime/realtime_conversation_item_function_call.rbi +16 -7
  81. data/rbi/openai/models/realtime/realtime_conversation_item_function_call_output.rbi +14 -7
  82. data/rbi/openai/models/realtime/realtime_conversation_item_system_message.rbi +16 -6
  83. data/rbi/openai/models/realtime/realtime_conversation_item_user_message.rbi +110 -12
  84. data/rbi/openai/models/realtime/realtime_response.rbi +287 -212
  85. data/rbi/openai/models/realtime/realtime_response_create_audio_output.rbi +250 -0
  86. data/rbi/openai/models/realtime/realtime_response_create_mcp_tool.rbi +616 -0
  87. data/rbi/openai/models/realtime/realtime_response_create_params.rbi +529 -0
  88. data/rbi/openai/models/realtime/realtime_response_usage.rbi +8 -2
  89. data/rbi/openai/models/realtime/realtime_response_usage_input_token_details.rbi +106 -7
  90. data/rbi/openai/models/realtime/realtime_server_event.rbi +4 -1
  91. data/rbi/openai/models/realtime/realtime_session.rbi +12 -262
  92. data/rbi/openai/models/realtime/realtime_session_client_secret.rbi +49 -0
  93. data/rbi/openai/models/realtime/realtime_session_create_request.rbi +112 -133
  94. data/rbi/openai/models/realtime/realtime_session_create_response.rbi +1229 -405
  95. data/rbi/openai/models/realtime/realtime_tools_config_union.rbi +1 -117
  96. data/rbi/openai/models/realtime/realtime_tracing_config.rbi +11 -10
  97. data/rbi/openai/models/realtime/realtime_transcription_session_audio.rbi +50 -0
  98. data/rbi/openai/models/realtime/realtime_transcription_session_audio_input.rbi +226 -0
  99. data/rbi/openai/models/realtime/realtime_transcription_session_audio_input_turn_detection.rbi +259 -0
  100. data/rbi/openai/models/realtime/realtime_transcription_session_client_secret.rbi +51 -0
  101. data/rbi/openai/models/realtime/realtime_transcription_session_create_request.rbi +25 -597
  102. data/rbi/openai/models/realtime/realtime_transcription_session_create_response.rbi +195 -0
  103. data/rbi/openai/models/realtime/realtime_transcription_session_input_audio_transcription.rbi +144 -0
  104. data/rbi/openai/models/realtime/realtime_transcription_session_turn_detection.rbi +94 -0
  105. data/rbi/openai/models/realtime/realtime_truncation.rbi +5 -56
  106. data/rbi/openai/models/realtime/realtime_truncation_retention_ratio.rbi +45 -0
  107. data/rbi/openai/models/realtime/response_cancel_event.rbi +3 -1
  108. data/rbi/openai/models/realtime/response_create_event.rbi +19 -786
  109. data/rbi/openai/models/realtime/response_done_event.rbi +7 -0
  110. data/rbi/openai/models/realtime/session_created_event.rbi +42 -9
  111. data/rbi/openai/models/realtime/session_update_event.rbi +57 -19
  112. data/rbi/openai/models/realtime/session_updated_event.rbi +42 -9
  113. data/rbi/openai/models/realtime/transcription_session_created.rbi +17 -591
  114. data/rbi/openai/models/realtime/transcription_session_update.rbi +425 -7
  115. data/rbi/openai/models/realtime/transcription_session_updated_event.rbi +14 -591
  116. data/rbi/openai/resources/realtime/client_secrets.rbi +5 -3
  117. data/sig/openai/models/realtime/audio_transcription.rbs +57 -0
  118. data/sig/openai/models/realtime/client_secret_create_response.rbs +1 -251
  119. data/sig/openai/models/realtime/models.rbs +57 -0
  120. data/sig/openai/models/realtime/noise_reduction_type.rbs +16 -0
  121. data/sig/openai/models/realtime/realtime_audio_config.rbs +12 -331
  122. data/sig/openai/models/realtime/realtime_audio_config_input.rbs +72 -0
  123. data/sig/openai/models/realtime/realtime_audio_config_output.rbs +72 -0
  124. data/sig/openai/models/realtime/realtime_audio_formats.rbs +128 -0
  125. data/sig/openai/models/realtime/realtime_audio_input_turn_detection.rbs +99 -0
  126. data/sig/openai/models/realtime/realtime_conversation_item_assistant_message.rbs +17 -2
  127. data/sig/openai/models/realtime/realtime_conversation_item_user_message.rbs +30 -1
  128. data/sig/openai/models/realtime/realtime_response.rbs +103 -82
  129. data/sig/openai/models/realtime/realtime_response_create_audio_output.rbs +84 -0
  130. data/sig/openai/models/realtime/realtime_response_create_mcp_tool.rbs +218 -0
  131. data/sig/openai/models/realtime/realtime_response_create_params.rbs +148 -0
  132. data/sig/openai/models/realtime/realtime_response_usage_input_token_details.rbs +50 -1
  133. data/sig/openai/models/realtime/realtime_session.rbs +16 -106
  134. data/sig/openai/models/realtime/realtime_session_client_secret.rbs +20 -0
  135. data/sig/openai/models/realtime/realtime_session_create_request.rbs +27 -43
  136. data/sig/openai/models/realtime/realtime_session_create_response.rbs +389 -187
  137. data/sig/openai/models/realtime/realtime_tools_config_union.rbs +1 -53
  138. data/sig/openai/models/realtime/realtime_transcription_session_audio.rbs +24 -0
  139. data/sig/openai/models/realtime/realtime_transcription_session_audio_input.rbs +72 -0
  140. data/sig/openai/models/realtime/realtime_transcription_session_audio_input_turn_detection.rbs +99 -0
  141. data/sig/openai/models/realtime/realtime_transcription_session_client_secret.rbs +20 -0
  142. data/sig/openai/models/realtime/realtime_transcription_session_create_request.rbs +11 -203
  143. data/sig/openai/models/realtime/realtime_transcription_session_create_response.rbs +69 -0
  144. data/sig/openai/models/realtime/realtime_transcription_session_input_audio_transcription.rbs +59 -0
  145. data/sig/openai/models/realtime/realtime_transcription_session_turn_detection.rbs +47 -0
  146. data/sig/openai/models/realtime/realtime_truncation.rbs +1 -28
  147. data/sig/openai/models/realtime/realtime_truncation_retention_ratio.rbs +21 -0
  148. data/sig/openai/models/realtime/response_create_event.rbs +6 -249
  149. data/sig/openai/models/realtime/session_created_event.rbs +14 -4
  150. data/sig/openai/models/realtime/session_update_event.rbs +14 -4
  151. data/sig/openai/models/realtime/session_updated_event.rbs +14 -4
  152. data/sig/openai/models/realtime/transcription_session_created.rbs +4 -254
  153. data/sig/openai/models/realtime/transcription_session_update.rbs +154 -4
  154. data/sig/openai/models/realtime/transcription_session_updated_event.rbs +4 -254
  155. metadata +59 -5
  156. data/lib/openai/models/realtime/realtime_client_secret_config.rb +0 -64
  157. data/rbi/openai/models/realtime/realtime_client_secret_config.rbi +0 -147
  158. data/sig/openai/models/realtime/realtime_client_secret_config.rbs +0 -60
@@ -35,7 +35,7 @@ module OpenAI
35
35
  session:
36
36
  T.any(
37
37
  OpenAI::Realtime::RealtimeSessionCreateResponse::OrHash,
38
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::OrHash
38
+ OpenAI::Realtime::RealtimeTranscriptionSessionCreateResponse::OrHash
39
39
  ),
40
40
  value: String
41
41
  ).returns(T.attached_class)
@@ -71,595 +71,10 @@ module OpenAI
71
71
  T.type_alias do
72
72
  T.any(
73
73
  OpenAI::Realtime::RealtimeSessionCreateResponse,
74
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse
74
+ OpenAI::Realtime::RealtimeTranscriptionSessionCreateResponse
75
75
  )
76
76
  end
77
77
 
78
- class RealtimeTranscriptionSessionCreateResponse < OpenAI::Internal::Type::BaseModel
79
- OrHash =
80
- T.type_alias do
81
- T.any(
82
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse,
83
- OpenAI::Internal::AnyHash
84
- )
85
- end
86
-
87
- # Unique identifier for the session that looks like `sess_1234567890abcdef`.
88
- sig { returns(T.nilable(String)) }
89
- attr_reader :id
90
-
91
- sig { params(id: String).void }
92
- attr_writer :id
93
-
94
- # Configuration for input audio for the session.
95
- sig do
96
- returns(
97
- T.nilable(
98
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio
99
- )
100
- )
101
- end
102
- attr_reader :audio
103
-
104
- sig do
105
- params(
106
- audio:
107
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::OrHash
108
- ).void
109
- end
110
- attr_writer :audio
111
-
112
- # Expiration timestamp for the session, in seconds since epoch.
113
- sig { returns(T.nilable(Integer)) }
114
- attr_reader :expires_at
115
-
116
- sig { params(expires_at: Integer).void }
117
- attr_writer :expires_at
118
-
119
- # Additional fields to include in server outputs.
120
- #
121
- # - `item.input_audio_transcription.logprobs`: Include logprobs for input audio
122
- # transcription.
123
- sig do
124
- returns(
125
- T.nilable(
126
- T::Array[
127
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::TaggedSymbol
128
- ]
129
- )
130
- )
131
- end
132
- attr_reader :include
133
-
134
- sig do
135
- params(
136
- include:
137
- T::Array[
138
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::OrSymbol
139
- ]
140
- ).void
141
- end
142
- attr_writer :include
143
-
144
- # The object type. Always `realtime.transcription_session`.
145
- sig { returns(T.nilable(String)) }
146
- attr_reader :object
147
-
148
- sig { params(object: String).void }
149
- attr_writer :object
150
-
151
- # A Realtime transcription session configuration object.
152
- sig do
153
- params(
154
- id: String,
155
- audio:
156
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::OrHash,
157
- expires_at: Integer,
158
- include:
159
- T::Array[
160
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::OrSymbol
161
- ],
162
- object: String
163
- ).returns(T.attached_class)
164
- end
165
- def self.new(
166
- # Unique identifier for the session that looks like `sess_1234567890abcdef`.
167
- id: nil,
168
- # Configuration for input audio for the session.
169
- audio: nil,
170
- # Expiration timestamp for the session, in seconds since epoch.
171
- expires_at: nil,
172
- # Additional fields to include in server outputs.
173
- #
174
- # - `item.input_audio_transcription.logprobs`: Include logprobs for input audio
175
- # transcription.
176
- include: nil,
177
- # The object type. Always `realtime.transcription_session`.
178
- object: nil
179
- )
180
- end
181
-
182
- sig do
183
- override.returns(
184
- {
185
- id: String,
186
- audio:
187
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio,
188
- expires_at: Integer,
189
- include:
190
- T::Array[
191
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::TaggedSymbol
192
- ],
193
- object: String
194
- }
195
- )
196
- end
197
- def to_hash
198
- end
199
-
200
- class Audio < OpenAI::Internal::Type::BaseModel
201
- OrHash =
202
- T.type_alias do
203
- T.any(
204
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio,
205
- OpenAI::Internal::AnyHash
206
- )
207
- end
208
-
209
- sig do
210
- returns(
211
- T.nilable(
212
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input
213
- )
214
- )
215
- end
216
- attr_reader :input
217
-
218
- sig do
219
- params(
220
- input:
221
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::OrHash
222
- ).void
223
- end
224
- attr_writer :input
225
-
226
- # Configuration for input audio for the session.
227
- sig do
228
- params(
229
- input:
230
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::OrHash
231
- ).returns(T.attached_class)
232
- end
233
- def self.new(input: nil)
234
- end
235
-
236
- sig do
237
- override.returns(
238
- {
239
- input:
240
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input
241
- }
242
- )
243
- end
244
- def to_hash
245
- end
246
-
247
- class Input < OpenAI::Internal::Type::BaseModel
248
- OrHash =
249
- T.type_alias do
250
- T.any(
251
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input,
252
- OpenAI::Internal::AnyHash
253
- )
254
- end
255
-
256
- # The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
257
- sig { returns(T.nilable(String)) }
258
- attr_reader :format_
259
-
260
- sig { params(format_: String).void }
261
- attr_writer :format_
262
-
263
- # Configuration for input audio noise reduction.
264
- sig do
265
- returns(
266
- T.nilable(
267
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction
268
- )
269
- )
270
- end
271
- attr_reader :noise_reduction
272
-
273
- sig do
274
- params(
275
- noise_reduction:
276
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::OrHash
277
- ).void
278
- end
279
- attr_writer :noise_reduction
280
-
281
- # Configuration of the transcription model.
282
- sig do
283
- returns(
284
- T.nilable(
285
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription
286
- )
287
- )
288
- end
289
- attr_reader :transcription
290
-
291
- sig do
292
- params(
293
- transcription:
294
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::OrHash
295
- ).void
296
- end
297
- attr_writer :transcription
298
-
299
- # Configuration for turn detection.
300
- sig do
301
- returns(
302
- T.nilable(
303
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::TurnDetection
304
- )
305
- )
306
- end
307
- attr_reader :turn_detection
308
-
309
- sig do
310
- params(
311
- turn_detection:
312
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::TurnDetection::OrHash
313
- ).void
314
- end
315
- attr_writer :turn_detection
316
-
317
- sig do
318
- params(
319
- format_: String,
320
- noise_reduction:
321
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::OrHash,
322
- transcription:
323
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::OrHash,
324
- turn_detection:
325
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::TurnDetection::OrHash
326
- ).returns(T.attached_class)
327
- end
328
- def self.new(
329
- # The format of input audio. Options are `pcm16`, `g711_ulaw`, or `g711_alaw`.
330
- format_: nil,
331
- # Configuration for input audio noise reduction.
332
- noise_reduction: nil,
333
- # Configuration of the transcription model.
334
- transcription: nil,
335
- # Configuration for turn detection.
336
- turn_detection: nil
337
- )
338
- end
339
-
340
- sig do
341
- override.returns(
342
- {
343
- format_: String,
344
- noise_reduction:
345
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction,
346
- transcription:
347
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription,
348
- turn_detection:
349
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::TurnDetection
350
- }
351
- )
352
- end
353
- def to_hash
354
- end
355
-
356
- class NoiseReduction < OpenAI::Internal::Type::BaseModel
357
- OrHash =
358
- T.type_alias do
359
- T.any(
360
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction,
361
- OpenAI::Internal::AnyHash
362
- )
363
- end
364
-
365
- sig do
366
- returns(
367
- T.nilable(
368
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::TaggedSymbol
369
- )
370
- )
371
- end
372
- attr_reader :type
373
-
374
- sig do
375
- params(
376
- type:
377
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::OrSymbol
378
- ).void
379
- end
380
- attr_writer :type
381
-
382
- # Configuration for input audio noise reduction.
383
- sig do
384
- params(
385
- type:
386
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::OrSymbol
387
- ).returns(T.attached_class)
388
- end
389
- def self.new(type: nil)
390
- end
391
-
392
- sig do
393
- override.returns(
394
- {
395
- type:
396
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::TaggedSymbol
397
- }
398
- )
399
- end
400
- def to_hash
401
- end
402
-
403
- module Type
404
- extend OpenAI::Internal::Type::Enum
405
-
406
- TaggedSymbol =
407
- T.type_alias do
408
- T.all(
409
- Symbol,
410
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type
411
- )
412
- end
413
- OrSymbol = T.type_alias { T.any(Symbol, String) }
414
-
415
- NEAR_FIELD =
416
- T.let(
417
- :near_field,
418
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::TaggedSymbol
419
- )
420
- FAR_FIELD =
421
- T.let(
422
- :far_field,
423
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::TaggedSymbol
424
- )
425
-
426
- sig do
427
- override.returns(
428
- T::Array[
429
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::NoiseReduction::Type::TaggedSymbol
430
- ]
431
- )
432
- end
433
- def self.values
434
- end
435
- end
436
- end
437
-
438
- class Transcription < OpenAI::Internal::Type::BaseModel
439
- OrHash =
440
- T.type_alias do
441
- T.any(
442
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription,
443
- OpenAI::Internal::AnyHash
444
- )
445
- end
446
-
447
- # The language of the input audio. Supplying the input language in
448
- # [ISO-639-1](https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes) (e.g. `en`)
449
- # format will improve accuracy and latency.
450
- sig { returns(T.nilable(String)) }
451
- attr_reader :language
452
-
453
- sig { params(language: String).void }
454
- attr_writer :language
455
-
456
- # The model to use for transcription. Can be `gpt-4o-transcribe`,
457
- # `gpt-4o-mini-transcribe`, or `whisper-1`.
458
- sig do
459
- returns(
460
- T.nilable(
461
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol
462
- )
463
- )
464
- end
465
- attr_reader :model
466
-
467
- sig do
468
- params(
469
- model:
470
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::OrSymbol
471
- ).void
472
- end
473
- attr_writer :model
474
-
475
- # An optional text to guide the model's style or continue a previous audio
476
- # segment. The
477
- # [prompt](https://platform.openai.com/docs/guides/speech-to-text#prompting)
478
- # should match the audio language.
479
- sig { returns(T.nilable(String)) }
480
- attr_reader :prompt
481
-
482
- sig { params(prompt: String).void }
483
- attr_writer :prompt
484
-
485
- # Configuration of the transcription model.
486
- sig do
487
- params(
488
- language: String,
489
- model:
490
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::OrSymbol,
491
- prompt: String
492
- ).returns(T.attached_class)
493
- end
494
- def self.new(
495
- # The language of the input audio. Supplying the input language in
496
- # [ISO-639-1](https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes) (e.g. `en`)
497
- # format will improve accuracy and latency.
498
- language: nil,
499
- # The model to use for transcription. Can be `gpt-4o-transcribe`,
500
- # `gpt-4o-mini-transcribe`, or `whisper-1`.
501
- model: nil,
502
- # An optional text to guide the model's style or continue a previous audio
503
- # segment. The
504
- # [prompt](https://platform.openai.com/docs/guides/speech-to-text#prompting)
505
- # should match the audio language.
506
- prompt: nil
507
- )
508
- end
509
-
510
- sig do
511
- override.returns(
512
- {
513
- language: String,
514
- model:
515
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol,
516
- prompt: String
517
- }
518
- )
519
- end
520
- def to_hash
521
- end
522
-
523
- # The model to use for transcription. Can be `gpt-4o-transcribe`,
524
- # `gpt-4o-mini-transcribe`, or `whisper-1`.
525
- module Model
526
- extend OpenAI::Internal::Type::Enum
527
-
528
- TaggedSymbol =
529
- T.type_alias do
530
- T.all(
531
- Symbol,
532
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model
533
- )
534
- end
535
- OrSymbol = T.type_alias { T.any(Symbol, String) }
536
-
537
- GPT_4O_TRANSCRIBE =
538
- T.let(
539
- :"gpt-4o-transcribe",
540
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol
541
- )
542
- GPT_4O_MINI_TRANSCRIBE =
543
- T.let(
544
- :"gpt-4o-mini-transcribe",
545
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol
546
- )
547
- WHISPER_1 =
548
- T.let(
549
- :"whisper-1",
550
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol
551
- )
552
-
553
- sig do
554
- override.returns(
555
- T::Array[
556
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::Transcription::Model::TaggedSymbol
557
- ]
558
- )
559
- end
560
- def self.values
561
- end
562
- end
563
- end
564
-
565
- class TurnDetection < OpenAI::Internal::Type::BaseModel
566
- OrHash =
567
- T.type_alias do
568
- T.any(
569
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Audio::Input::TurnDetection,
570
- OpenAI::Internal::AnyHash
571
- )
572
- end
573
-
574
- sig { returns(T.nilable(Integer)) }
575
- attr_reader :prefix_padding_ms
576
-
577
- sig { params(prefix_padding_ms: Integer).void }
578
- attr_writer :prefix_padding_ms
579
-
580
- sig { returns(T.nilable(Integer)) }
581
- attr_reader :silence_duration_ms
582
-
583
- sig { params(silence_duration_ms: Integer).void }
584
- attr_writer :silence_duration_ms
585
-
586
- sig { returns(T.nilable(Float)) }
587
- attr_reader :threshold
588
-
589
- sig { params(threshold: Float).void }
590
- attr_writer :threshold
591
-
592
- # Type of turn detection, only `server_vad` is currently supported.
593
- sig { returns(T.nilable(String)) }
594
- attr_reader :type
595
-
596
- sig { params(type: String).void }
597
- attr_writer :type
598
-
599
- # Configuration for turn detection.
600
- sig do
601
- params(
602
- prefix_padding_ms: Integer,
603
- silence_duration_ms: Integer,
604
- threshold: Float,
605
- type: String
606
- ).returns(T.attached_class)
607
- end
608
- def self.new(
609
- prefix_padding_ms: nil,
610
- silence_duration_ms: nil,
611
- threshold: nil,
612
- # Type of turn detection, only `server_vad` is currently supported.
613
- type: nil
614
- )
615
- end
616
-
617
- sig do
618
- override.returns(
619
- {
620
- prefix_padding_ms: Integer,
621
- silence_duration_ms: Integer,
622
- threshold: Float,
623
- type: String
624
- }
625
- )
626
- end
627
- def to_hash
628
- end
629
- end
630
- end
631
- end
632
-
633
- module Include
634
- extend OpenAI::Internal::Type::Enum
635
-
636
- TaggedSymbol =
637
- T.type_alias do
638
- T.all(
639
- Symbol,
640
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include
641
- )
642
- end
643
- OrSymbol = T.type_alias { T.any(Symbol, String) }
644
-
645
- ITEM_INPUT_AUDIO_TRANSCRIPTION_LOGPROBS =
646
- T.let(
647
- :"item.input_audio_transcription.logprobs",
648
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::TaggedSymbol
649
- )
650
-
651
- sig do
652
- override.returns(
653
- T::Array[
654
- OpenAI::Models::Realtime::ClientSecretCreateResponse::Session::RealtimeTranscriptionSessionCreateResponse::Include::TaggedSymbol
655
- ]
656
- )
657
- end
658
- def self.values
659
- end
660
- end
661
- end
662
-
663
78
  sig do
664
79
  override.returns(
665
80
  T::Array[
@@ -43,7 +43,20 @@ module OpenAI
43
43
  sig { returns(T.nilable(String)) }
44
44
  attr_accessor :previous_item_id
45
45
 
46
- # Returned when a conversation item is added.
46
+ # Sent by the server when an Item is added to the default Conversation. This can
47
+ # happen in several cases:
48
+ #
49
+ # - When the client sends a `conversation.item.create` event.
50
+ # - When the input audio buffer is committed. In this case the item will be a user
51
+ # message containing the audio from the buffer.
52
+ # - When the model is generating a Response. In this case the
53
+ # `conversation.item.added` event will be sent when the model starts generating
54
+ # a specific Item, and thus it will not yet have any content (and `status` will
55
+ # be `in_progress`).
56
+ #
57
+ # The event will include the full content of the Item (except when model is
58
+ # generating a Response) except for audio data, which can be retrieved separately
59
+ # with a `conversation.item.retrieve` event if necessary.
47
60
  sig do
48
61
  params(
49
62
  event_id: String,
@@ -44,6 +44,9 @@ module OpenAI
44
44
  attr_accessor :previous_item_id
45
45
 
46
46
  # Returned when a conversation item is finalized.
47
+ #
48
+ # The event will include the full content of the Item except for audio data, which
49
+ # can be retrieved separately with a `conversation.item.retrieve` event if needed.
47
50
  sig do
48
51
  params(
49
52
  event_id: String,
@@ -20,7 +20,7 @@ module OpenAI
20
20
  sig { returns(String) }
21
21
  attr_accessor :event_id
22
22
 
23
- # The ID of the user message item containing the audio.
23
+ # The ID of the item containing the audio that is being transcribed.
24
24
  sig { returns(String) }
25
25
  attr_accessor :item_id
26
26
 
@@ -32,7 +32,8 @@ module OpenAI
32
32
  sig { returns(Symbol) }
33
33
  attr_accessor :type
34
34
 
35
- # Usage statistics for the transcription.
35
+ # Usage statistics for the transcription, this is billed according to the ASR
36
+ # model's pricing rather than the realtime model's pricing.
36
37
  sig do
37
38
  returns(
38
39
  T.any(
@@ -51,9 +52,9 @@ module OpenAI
51
52
 
52
53
  # This event is the output of audio transcription for user audio written to the
53
54
  # user audio buffer. Transcription begins when the input audio buffer is committed
54
- # by the client or server (in `server_vad` mode). Transcription runs
55
- # asynchronously with Response creation, so this event may come before or after
56
- # the Response events.
55
+ # by the client or server (when VAD is enabled). Transcription runs asynchronously
56
+ # with Response creation, so this event may come before or after the Response
57
+ # events.
57
58
  #
58
59
  # Realtime API models accept audio natively, and thus input transcription is a
59
60
  # separate process run on a separate ASR (Automatic Speech Recognition) model. The
@@ -80,11 +81,12 @@ module OpenAI
80
81
  content_index:,
81
82
  # The unique ID of the server event.
82
83
  event_id:,
83
- # The ID of the user message item containing the audio.
84
+ # The ID of the item containing the audio that is being transcribed.
84
85
  item_id:,
85
86
  # The transcribed text.
86
87
  transcript:,
87
- # Usage statistics for the transcription.
88
+ # Usage statistics for the transcription, this is billed according to the ASR
89
+ # model's pricing rather than the realtime model's pricing.
88
90
  usage:,
89
91
  # The log probabilities of the transcription.
90
92
  logprobs: nil,
@@ -113,7 +115,8 @@ module OpenAI
113
115
  def to_hash
114
116
  end
115
117
 
116
- # Usage statistics for the transcription.
118
+ # Usage statistics for the transcription, this is billed according to the ASR
119
+ # model's pricing rather than the realtime model's pricing.
117
120
  module Usage
118
121
  extend OpenAI::Internal::Type::Union
119
122