openai
diff --git a/.stats.yml b/.stats.yml
Lines changed: 3 additions & 3 deletions
diff --git a/lib/openai/models/audio/speech_create_params.rb b/lib/openai/models/audio/speech_create_params.rb
Lines changed: 23 additions & 2 deletions
diff --git a/lib/openai/models/audio/transcription.rb b/lib/openai/models/audio/transcription.rb
Lines changed: 118 additions & 1 deletion
diff --git a/lib/openai/models/audio/transcription_text_done_event.rb b/lib/openai/models/audio/transcription_text_done_event.rb
Lines changed: 80 additions & 1 deletion
diff --git a/lib/openai/models/audio/transcription_verbose.rb b/lib/openai/models/audio/transcription_verbose.rb
Lines changed: 31 additions & 1 deletion
@@ -1,4 +1,4 @@
 configured_endpoints: 109
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-f411a68f272b8be0ab0c266043da33228687b9b2d76896724e3cef797de9563d.yml
-openapi_spec_hash: 89bf866ea95ecfb3d76c8833237047d6
-config_hash: dc5515e257676a27cb1ace1784aa92b3
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-ef4ecb19eb61e24c49d77fef769ee243e5279bc0bdbaee8d0f8dba4da8722559.yml
+openapi_spec_hash: 1b8a9767c9f04e6865b06c41948cdc24
+config_hash: fd2af1d5eff0995bb7dc02ac9a34851d
@@ -46,12 +46,19 @@ class SpeechCreateParams < OpenAI::Internal::Type::BaseModel
 
         # @!attribute speed
         #   The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
-        #   the default. Does not work with `gpt-4o-mini-tts`.
+        #   the default.
         #
         #   @return [Float, nil]
         optional :speed, Float
 
-        # @!method initialize(input:, model:, voice:, instructions: nil, response_format: nil, speed: nil, request_options: {})
+        # @!attribute stream_format
+        #   The format to stream the audio in. Supported formats are `sse` and `audio`.
+        #   `sse` is not supported for `tts-1` or `tts-1-hd`.
+        #
+        #   @return [Symbol, OpenAI::Models::Audio::SpeechCreateParams::StreamFormat, nil]
+        optional :stream_format, enum: -> { OpenAI::Audio::SpeechCreateParams::StreamFormat }
+
+        # @!method initialize(input:, model:, voice:, instructions: nil, response_format: nil, speed: nil, stream_format: nil, request_options: {})
         #   Some parameter documentation has been truncated, see
         #   {OpenAI::Models::Audio::SpeechCreateParams} for more details.
         #
@@ -67,6 +74,8 @@ class SpeechCreateParams < OpenAI::Internal::Type::BaseModel
         #
         #   @param speed [Float] The speed of the generated audio. Select a value from `0.25` to `4.0`. `1.0` is
         #
+        #   @param stream_format [Symbol, OpenAI::Models::Audio::SpeechCreateParams::StreamFormat] The format to stream the audio in. Supported formats are `sse` and `audio`. `sse
+        #
         #   @param request_options [OpenAI::RequestOptions, Hash{Symbol=>Object}]
 
         # One of the available [TTS models](https://platform.openai.com/docs/models#tts):
@@ -153,6 +162,18 @@ module ResponseFormat
           # @!method self.values
           #   @return [Array<Symbol>]
         end
+
+        # The format to stream the audio in. Supported formats are `sse` and `audio`.
+        # `sse` is not supported for `tts-1` or `tts-1-hd`.
+        module StreamFormat
+          extend OpenAI::Internal::Type::Enum
+
+          SSE = :sse
+          AUDIO = :audio
+
+          # @!method self.values
+          #   @return [Array<Symbol>]
+        end
       end
     end
   end
 
@@ -18,7 +18,13 @@ class Transcription < OpenAI::Internal::Type::BaseModel
         #   @return [Array<OpenAI::Models::Audio::Transcription::Logprob>, nil]
         optional :logprobs, -> { OpenAI::Internal::Type::ArrayOf[OpenAI::Audio::Transcription::Logprob] }
 
-        # @!method initialize(text:, logprobs: nil)
+        # @!attribute usage
+        #   Token usage statistics for the request.
+        #
+        #   @return [OpenAI::Models::Audio::Transcription::Usage::Tokens, OpenAI::Models::Audio::Transcription::Usage::Duration, nil]
+        optional :usage, union: -> { OpenAI::Audio::Transcription::Usage }
+
+        # @!method initialize(text:, logprobs: nil, usage: nil)
         #   Some parameter documentation has been truncated, see
         #   {OpenAI::Models::Audio::Transcription} for more details.
         #
@@ -28,6 +34,8 @@ class Transcription < OpenAI::Internal::Type::BaseModel
         #   @param text [String] The transcribed text.
         #
         #   @param logprobs [Array<OpenAI::Models::Audio::Transcription::Logprob>] The log probabilities of the tokens in the transcription. Only returned with the
+        #
+        #   @param usage [OpenAI::Models::Audio::Transcription::Usage::Tokens, OpenAI::Models::Audio::Transcription::Usage::Duration] Token usage statistics for the request.
 
         class Logprob < OpenAI::Internal::Type::BaseModel
           # @!attribute token
@@ -55,6 +63,115 @@ class Logprob < OpenAI::Internal::Type::BaseModel
           #
           #   @param logprob [Float] The log probability of the token.
         end
+
+        # Token usage statistics for the request.
+        #
+        # @see OpenAI::Models::Audio::Transcription#usage
+        module Usage
+          extend OpenAI::Internal::Type::Union
+
+          discriminator :type
+
+          # Usage statistics for models billed by token usage.
+          variant :tokens, -> { OpenAI::Audio::Transcription::Usage::Tokens }
+
+          # Usage statistics for models billed by audio input duration.
+          variant :duration, -> { OpenAI::Audio::Transcription::Usage::Duration }
+
+          class Tokens < OpenAI::Internal::Type::BaseModel
+            # @!attribute input_tokens
+            #   Number of input tokens billed for this request.
+            #
+            #   @return [Integer]
+            required :input_tokens, Integer
+
+            # @!attribute output_tokens
+            #   Number of output tokens generated.
+            #
+            #   @return [Integer]
+            required :output_tokens, Integer
+
+            # @!attribute total_tokens
+            #   Total number of tokens used (input + output).
+            #
+            #   @return [Integer]
+            required :total_tokens, Integer
+
+            # @!attribute type
+            #   The type of the usage object. Always `tokens` for this variant.
+            #
+            #   @return [Symbol, :tokens]
+            required :type, const: :tokens
+
+            # @!attribute input_token_details
+            #   Details about the input tokens billed for this request.
+            #
+            #   @return [OpenAI::Models::Audio::Transcription::Usage::Tokens::InputTokenDetails, nil]
+            optional :input_token_details,
+                     -> {
+                       OpenAI::Audio::Transcription::Usage::Tokens::InputTokenDetails
+                     }
+
+            # @!method initialize(input_tokens:, output_tokens:, total_tokens:, input_token_details: nil, type: :tokens)
+            #   Usage statistics for models billed by token usage.
+            #
+            #   @param input_tokens [Integer] Number of input tokens billed for this request.
+            #
+            #   @param output_tokens [Integer] Number of output tokens generated.
+            #
+            #   @param total_tokens [Integer] Total number of tokens used (input + output).
+            #
+            #   @param input_token_details [OpenAI::Models::Audio::Transcription::Usage::Tokens::InputTokenDetails] Details about the input tokens billed for this request.
+            #
+            #   @param type [Symbol, :tokens] The type of the usage object. Always `tokens` for this variant.
+
+            # @see OpenAI::Models::Audio::Transcription::Usage::Tokens#input_token_details
+            class InputTokenDetails < OpenAI::Internal::Type::BaseModel
+              # @!attribute audio_tokens
+              #   Number of audio tokens billed for this request.
+              #
+              #   @return [Integer, nil]
+              optional :audio_tokens, Integer
+
+              # @!attribute text_tokens
+              #   Number of text tokens billed for this request.
+              #
+              #   @return [Integer, nil]
+              optional :text_tokens, Integer
+
+              # @!method initialize(audio_tokens: nil, text_tokens: nil)
+              #   Details about the input tokens billed for this request.
+              #
+              #   @param audio_tokens [Integer] Number of audio tokens billed for this request.
+              #
+              #   @param text_tokens [Integer] Number of text tokens billed for this request.
+            end
+          end
+
+          class Duration < OpenAI::Internal::Type::BaseModel
+            # @!attribute duration
+            #   Duration of the input audio in seconds.
+            #
+            #   @return [Float]
+            required :duration, Float
+
+            # @!attribute type
+            #   The type of the usage object. Always `duration` for this variant.
+            #
+            #   @return [Symbol, :duration]
+            required :type, const: :duration
+
+            # @!method initialize(duration:, type: :duration)
+            #   Usage statistics for models billed by audio input duration.
+            #
+            #   @param duration [Float] Duration of the input audio in seconds.
+            #
+            #   @param type [Symbol, :duration] The type of the usage object. Always `duration` for this variant.
+          end
+
+          # @!method self.variants
+          #   @return [Array(OpenAI::Models::Audio::Transcription::Usage::Tokens, OpenAI::Models::Audio::Transcription::Usage::Duration)]
+        end
       end
     end
   end
 
@@ -26,7 +26,13 @@ class TranscriptionTextDoneEvent < OpenAI::Internal::Type::BaseModel
         optional :logprobs,
                  -> { OpenAI::Internal::Type::ArrayOf[OpenAI::Audio::TranscriptionTextDoneEvent::Logprob] }
 
-        # @!method initialize(text:, logprobs: nil, type: :"transcript.text.done")
+        # @!attribute usage
+        #   Usage statistics for models billed by token usage.
+        #
+        #   @return [OpenAI::Models::Audio::TranscriptionTextDoneEvent::Usage, nil]
+        optional :usage, -> { OpenAI::Audio::TranscriptionTextDoneEvent::Usage }
+
+        # @!method initialize(text:, logprobs: nil, usage: nil, type: :"transcript.text.done")
         #   Some parameter documentation has been truncated, see
         #   {OpenAI::Models::Audio::TranscriptionTextDoneEvent} for more details.
         #
@@ -39,6 +45,8 @@ class TranscriptionTextDoneEvent < OpenAI::Internal::Type::BaseModel
         #
         #   @param logprobs [Array<OpenAI::Models::Audio::TranscriptionTextDoneEvent::Logprob>] The log probabilities of the individual tokens in the transcription. Only includ
         #
+        #   @param usage [OpenAI::Models::Audio::TranscriptionTextDoneEvent::Usage] Usage statistics for models billed by token usage.
+        #
         #   @param type [Symbol, :"transcript.text.done"] The type of the event. Always `transcript.text.done`.
 
         class Logprob < OpenAI::Internal::Type::BaseModel
@@ -70,6 +78,77 @@ class Logprob < OpenAI::Internal::Type::BaseModel
           #
           #   @param logprob [Float] The log probability of the token.
         end
+
+        # @see OpenAI::Models::Audio::TranscriptionTextDoneEvent#usage
+        class Usage < OpenAI::Internal::Type::BaseModel
+          # @!attribute input_tokens
+          #   Number of input tokens billed for this request.
+          #
+          #   @return [Integer]
+          required :input_tokens, Integer
+
+          # @!attribute output_tokens
+          #   Number of output tokens generated.
+          #
+          #   @return [Integer]
+          required :output_tokens, Integer
+
+          # @!attribute total_tokens
+          #   Total number of tokens used (input + output).
+          #
+          #   @return [Integer]
+          required :total_tokens, Integer
+
+          # @!attribute type
+          #   The type of the usage object. Always `tokens` for this variant.
+          #
+          #   @return [Symbol, :tokens]
+          required :type, const: :tokens
+
+          # @!attribute input_token_details
+          #   Details about the input tokens billed for this request.
+          #
+          #   @return [OpenAI::Models::Audio::TranscriptionTextDoneEvent::Usage::InputTokenDetails, nil]
+          optional :input_token_details,
+                   -> {
+                     OpenAI::Audio::TranscriptionTextDoneEvent::Usage::InputTokenDetails
+                   }
+
+          # @!method initialize(input_tokens:, output_tokens:, total_tokens:, input_token_details: nil, type: :tokens)
+          #   Usage statistics for models billed by token usage.
+          #
+          #   @param input_tokens [Integer] Number of input tokens billed for this request.
+          #
+          #   @param output_tokens [Integer] Number of output tokens generated.
+          #
+          #   @param total_tokens [Integer] Total number of tokens used (input + output).
+          #
+          #   @param input_token_details [OpenAI::Models::Audio::TranscriptionTextDoneEvent::Usage::InputTokenDetails] Details about the input tokens billed for this request.
+          #
+          #   @param type [Symbol, :tokens] The type of the usage object. Always `tokens` for this variant.
+
+          # @see OpenAI::Models::Audio::TranscriptionTextDoneEvent::Usage#input_token_details
+          class InputTokenDetails < OpenAI::Internal::Type::BaseModel
+            # @!attribute audio_tokens
+            #   Number of audio tokens billed for this request.
+            #
+            #   @return [Integer, nil]
+            optional :audio_tokens, Integer
+
+            # @!attribute text_tokens
+            #   Number of text tokens billed for this request.
+            #
+            #   @return [Integer, nil]
+            optional :text_tokens, Integer
+
+            # @!method initialize(audio_tokens: nil, text_tokens: nil)
+            #   Details about the input tokens billed for this request.
+            #
+            #   @param audio_tokens [Integer] Number of audio tokens billed for this request.
+            #
+            #   @param text_tokens [Integer] Number of text tokens billed for this request.
+          end
+        end
       end
     end
   end
 
@@ -28,13 +28,19 @@ class TranscriptionVerbose < OpenAI::Internal::Type::BaseModel
         #   @return [Array<OpenAI::Models::Audio::TranscriptionSegment>, nil]
         optional :segments, -> { OpenAI::Internal::Type::ArrayOf[OpenAI::Audio::TranscriptionSegment] }
 
+        # @!attribute usage
+        #   Usage statistics for models billed by audio input duration.
+        #
+        #   @return [OpenAI::Models::Audio::TranscriptionVerbose::Usage, nil]
+        optional :usage, -> { OpenAI::Audio::TranscriptionVerbose::Usage }
+
         # @!attribute words
         #   Extracted words and their corresponding timestamps.
         #
         #   @return [Array<OpenAI::Models::Audio::TranscriptionWord>, nil]
         optional :words, -> { OpenAI::Internal::Type::ArrayOf[OpenAI::Audio::TranscriptionWord] }
 
-        # @!method initialize(duration:, language:, text:, segments: nil, words: nil)
+        # @!method initialize(duration:, language:, text:, segments: nil, usage: nil, words: nil)
         #   Represents a verbose json transcription response returned by model, based on the
         #   provided input.
         #
@@ -46,7 +52,31 @@ class TranscriptionVerbose < OpenAI::Internal::Type::BaseModel
         #
         #   @param segments [Array<OpenAI::Models::Audio::TranscriptionSegment>] Segments of the transcribed text and their corresponding details.
         #
+        #   @param usage [OpenAI::Models::Audio::TranscriptionVerbose::Usage] Usage statistics for models billed by audio input duration.
+        #
         #   @param words [Array<OpenAI::Models::Audio::TranscriptionWord>] Extracted words and their corresponding timestamps.
+
+        # @see OpenAI::Models::Audio::TranscriptionVerbose#usage
+        class Usage < OpenAI::Internal::Type::BaseModel
+          # @!attribute duration
+          #   Duration of the input audio in seconds.
+          #
+          #   @return [Float]
+          required :duration, Float
+
+          # @!attribute type
+          #   The type of the usage object. Always `duration` for this variant.
+          #
+          #   @return [Symbol, :duration]
+          required :type, const: :duration
+
+          # @!method initialize(duration:, type: :duration)
+          #   Usage statistics for models billed by audio input duration.
+          #
+          #   @param duration [Float] Duration of the input audio in seconds.
+          #
+          #   @param type [Symbol, :duration] The type of the usage object. Always `duration` for this variant.
+        end
       end
     end
   end