openai
diff --git a/.stats.yml b/.stats.yml
Lines changed: 3 additions & 3 deletions
diff --git a/lib/openai/models/chat/chat_completion.rb b/lib/openai/models/chat/chat_completion.rb
Lines changed: 36 additions & 3 deletions
diff --git a/lib/openai/models/chat/chat_completion_audio_param.rb b/lib/openai/models/chat/chat_completion_audio_param.rb
Lines changed: 3 additions & 2 deletions
diff --git a/lib/openai/models/chat/chat_completion_chunk.rb b/lib/openai/models/chat/chat_completion_chunk.rb
Lines changed: 36 additions & 3 deletions
diff --git a/lib/openai/models/chat/completion_create_params.rb b/lib/openai/models/chat/completion_create_params.rb
Lines changed: 15 additions & 4 deletions
diff --git a/lib/openai/models/chat_model.rb b/lib/openai/models/chat_model.rb
Lines changed: 4 additions & 0 deletions
diff --git a/lib/openai/models/completion_create_params.rb b/lib/openai/models/completion_create_params.rb
Lines changed: 4 additions & 0 deletions
diff --git a/lib/openai/models/reasoning.rb b/lib/openai/models/reasoning.rb
Lines changed: 38 additions & 7 deletions
@@ -1,4 +1,4 @@
 configured_endpoints: 95
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-a555f81249cb084f463dcefa4aba069f9341fdaf3dd6ac27d7f237fc90e8f488.yml
-openapi_spec_hash: 8e590296cd1a54b9508510b0c7a2c45a
-config_hash: 5ea32de61ff42fcf5e66cff8d9e247ea
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-5633633cc38734869cf7d993f7b549bb8e4d10e0ec45381ec2cd91507cd8eb8f.yml
+openapi_spec_hash: c855121b2b2324b99499c9244c21d24d
+config_hash: d20837393b73efdb19cd08e04c1cc9a1
@@ -39,7 +39,23 @@ class ChatCompletion < OpenAI::Internal::Type::BaseModel
         required :object, const: :"chat.completion"
 
         # @!attribute service_tier
-        #   The service tier used for processing the request.
+        #   Specifies the latency tier to use for processing the request. This parameter is
+        #   relevant for customers subscribed to the scale tier service:
+        #
+        #   - If set to 'auto', and the Project is Scale tier enabled, the system will
+        #     utilize scale tier credits until they are exhausted.
+        #   - If set to 'auto', and the Project is not Scale tier enabled, the request will
+        #     be processed using the default service tier with a lower uptime SLA and no
+        #     latency guarantee.
+        #   - If set to 'default', the request will be processed using the default service
+        #     tier with a lower uptime SLA and no latency guarantee.
+        #   - If set to 'flex', the request will be processed with the Flex Processing
+        #     service tier.
+        #     [Learn more](https://platform.openai.com/docs/guides/flex-processing).
+        #   - When not set, the default behavior is 'auto'.
+        #
+        #   When this parameter is set, the response body will include the `service_tier`
+        #   utilized.
         #
         #   @return [Symbol, OpenAI::Models::Chat::ChatCompletion::ServiceTier, nil]
         optional :service_tier, enum: -> { OpenAI::Models::Chat::ChatCompletion::ServiceTier }, nil?: true
@@ -190,14 +206,31 @@ class Logprobs < OpenAI::Internal::Type::BaseModel
           end
         end
 
-        # The service tier used for processing the request.
+        # Specifies the latency tier to use for processing the request. This parameter is
+        # relevant for customers subscribed to the scale tier service:
+        #
+        # - If set to 'auto', and the Project is Scale tier enabled, the system will
+        #   utilize scale tier credits until they are exhausted.
+        # - If set to 'auto', and the Project is not Scale tier enabled, the request will
+        #   be processed using the default service tier with a lower uptime SLA and no
+        #   latency guarantee.
+        # - If set to 'default', the request will be processed using the default service
+        #   tier with a lower uptime SLA and no latency guarantee.
+        # - If set to 'flex', the request will be processed with the Flex Processing
+        #   service tier.
+        #   [Learn more](https://platform.openai.com/docs/guides/flex-processing).
+        # - When not set, the default behavior is 'auto'.
+        #
+        # When this parameter is set, the response body will include the `service_tier`
+        # utilized.
         #
         # @see OpenAI::Models::Chat::ChatCompletion#service_tier
         module ServiceTier
           extend OpenAI::Internal::Type::Enum
 
-          SCALE = :scale
+          AUTO = :auto
           DEFAULT = :default
+          FLEX = :flex
 
           finalize!
 
 
@@ -13,7 +13,7 @@ class ChatCompletionAudioParam < OpenAI::Internal::Type::BaseModel
 
         # @!attribute voice
         #   The voice the model uses to respond. Supported voices are `alloy`, `ash`,
-        #   `ballad`, `coral`, `echo`, `sage`, and `shimmer`.
+        #   `ballad`, `coral`, `echo`, `fable`, `nova`, `onyx`, `sage`, and `shimmer`.
         #
         #   @return [String, Symbol, OpenAI::Models::Chat::ChatCompletionAudioParam::Voice]
         required :voice, union: -> { OpenAI::Models::Chat::ChatCompletionAudioParam::Voice }
@@ -38,6 +38,7 @@ module Format
           extend OpenAI::Internal::Type::Enum
 
           WAV = :wav
+          AAC = :aac
           MP3 = :mp3
           FLAC = :flac
           OPUS = :opus
@@ -51,7 +52,7 @@ module Format
         end
 
         # The voice the model uses to respond. Supported voices are `alloy`, `ash`,
-        # `ballad`, `coral`, `echo`, `sage`, and `shimmer`.
+        # `ballad`, `coral`, `echo`, `fable`, `nova`, `onyx`, `sage`, and `shimmer`.
         #
         # @see OpenAI::Models::Chat::ChatCompletionAudioParam#voice
         module Voice
 
@@ -39,7 +39,23 @@ class ChatCompletionChunk < OpenAI::Internal::Type::BaseModel
         required :object, const: :"chat.completion.chunk"
 
         # @!attribute service_tier
-        #   The service tier used for processing the request.
+        #   Specifies the latency tier to use for processing the request. This parameter is
+        #   relevant for customers subscribed to the scale tier service:
+        #
+        #   - If set to 'auto', and the Project is Scale tier enabled, the system will
+        #     utilize scale tier credits until they are exhausted.
+        #   - If set to 'auto', and the Project is not Scale tier enabled, the request will
+        #     be processed using the default service tier with a lower uptime SLA and no
+        #     latency guarantee.
+        #   - If set to 'default', the request will be processed using the default service
+        #     tier with a lower uptime SLA and no latency guarantee.
+        #   - If set to 'flex', the request will be processed with the Flex Processing
+        #     service tier.
+        #     [Learn more](https://platform.openai.com/docs/guides/flex-processing).
+        #   - When not set, the default behavior is 'auto'.
+        #
+        #   When this parameter is set, the response body will include the `service_tier`
+        #   utilized.
         #
         #   @return [Symbol, OpenAI::Models::Chat::ChatCompletionChunk::ServiceTier, nil]
         optional :service_tier, enum: -> { OpenAI::Models::Chat::ChatCompletionChunk::ServiceTier }, nil?: true
@@ -406,14 +422,31 @@ class Logprobs < OpenAI::Internal::Type::BaseModel
           end
         end
 
-        # The service tier used for processing the request.
+        # Specifies the latency tier to use for processing the request. This parameter is
+        # relevant for customers subscribed to the scale tier service:
+        #
+        # - If set to 'auto', and the Project is Scale tier enabled, the system will
+        #   utilize scale tier credits until they are exhausted.
+        # - If set to 'auto', and the Project is not Scale tier enabled, the request will
+        #   be processed using the default service tier with a lower uptime SLA and no
+        #   latency guarantee.
+        # - If set to 'default', the request will be processed using the default service
+        #   tier with a lower uptime SLA and no latency guarantee.
+        # - If set to 'flex', the request will be processed with the Flex Processing
+        #   service tier.
+        #   [Learn more](https://platform.openai.com/docs/guides/flex-processing).
+        # - When not set, the default behavior is 'auto'.
+        #
+        # When this parameter is set, the response body will include the `service_tier`
+        # utilized.
         #
         # @see OpenAI::Models::Chat::ChatCompletionChunk#service_tier
         module ServiceTier
           extend OpenAI::Internal::Type::Enum
 
-          SCALE = :scale
+          AUTO = :auto
           DEFAULT = :default
+          FLEX = :flex
 
           finalize!
 
 
@@ -24,7 +24,7 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
                  -> { OpenAI::Internal::Type::ArrayOf[union: OpenAI::Models::Chat::ChatCompletionMessageParam] }
 
         # @!attribute model
-        #   Model ID used to generate the response, like `gpt-4o` or `o1`. OpenAI offers a
+        #   Model ID used to generate the response, like `gpt-4o` or `o3`. OpenAI offers a
         #   wide range of models with different capabilities, performance characteristics,
         #   and price points. Refer to the
         #   [model guide](https://platform.openai.com/docs/models) to browse and compare
@@ -121,7 +121,7 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
         #
         #   This value is now deprecated in favor of `max_completion_tokens`, and is not
         #   compatible with
-        #   [o1 series models](https://platform.openai.com/docs/guides/reasoning).
+        #   [o-series models](https://platform.openai.com/docs/guides/reasoning).
         #
         #   @return [Integer, nil]
         optional :max_tokens, Integer, nil?: true
@@ -240,6 +240,9 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
         #     latency guarentee.
         #   - If set to 'default', the request will be processed using the default service
         #     tier with a lower uptime SLA and no latency guarentee.
+        #   - If set to 'flex', the request will be processed with the Flex Processing
+        #     service tier.
+        #     [Learn more](https://platform.openai.com/docs/guides/flex-processing).
         #   - When not set, the default behavior is 'auto'.
         #
         #   When this parameter is set, the response body will include the `service_tier`
@@ -249,6 +252,8 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
         optional :service_tier, enum: -> { OpenAI::Models::Chat::CompletionCreateParams::ServiceTier }, nil?: true
 
         # @!attribute stop
+        #   Not supported with latest reasoning models `o3` and `o4-mini`.
+        #
         #   Up to 4 sequences where the API will stop generating further tokens. The
         #   returned text will not contain the stop sequence.
         #
@@ -422,7 +427,7 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
 
         # def initialize: (Hash | OpenAI::Internal::Type::BaseModel) -> void
 
-        # Model ID used to generate the response, like `gpt-4o` or `o1`. OpenAI offers a
+        # Model ID used to generate the response, like `gpt-4o` or `o3`. OpenAI offers a
         # wide range of models with different capabilities, performance characteristics,
         # and price points. Refer to the
         # [model guide](https://platform.openai.com/docs/models) to browse and compare
@@ -432,7 +437,7 @@ module Model
 
           variant String
 
-          # Model ID used to generate the response, like `gpt-4o` or `o1`. OpenAI
+          # Model ID used to generate the response, like `gpt-4o` or `o3`. OpenAI
           # offers a wide range of models with different capabilities, performance
           # characteristics, and price points. Refer to the [model guide](https://platform.openai.com/docs/models)
           # to browse and compare available models.
@@ -589,6 +594,9 @@ module ResponseFormat
         #   latency guarentee.
         # - If set to 'default', the request will be processed using the default service
         #   tier with a lower uptime SLA and no latency guarentee.
+        # - If set to 'flex', the request will be processed with the Flex Processing
+        #   service tier.
+        #   [Learn more](https://platform.openai.com/docs/guides/flex-processing).
         # - When not set, the default behavior is 'auto'.
         #
         # When this parameter is set, the response body will include the `service_tier`
@@ -598,6 +606,7 @@ module ServiceTier
 
           AUTO = :auto
           DEFAULT = :default
+          FLEX = :flex
 
           finalize!
 
@@ -606,6 +615,8 @@ module ServiceTier
           #   def self.values; end
         end
 
+        # Not supported with latest reasoning models `o3` and `o4-mini`.
+        #
         # Up to 4 sequences where the API will stop generating further tokens. The
         # returned text will not contain the stop sequence.
         module Stop
 
@@ -11,6 +11,10 @@ module ChatModel
       GPT_4_1_2025_04_14 = :"gpt-4.1-2025-04-14"
       GPT_4_1_MINI_2025_04_14 = :"gpt-4.1-mini-2025-04-14"
       GPT_4_1_NANO_2025_04_14 = :"gpt-4.1-nano-2025-04-14"
+      O4_MINI = :"o4-mini"
+      O4_MINI_2025_04_16 = :"o4-mini-2025-04-16"
+      O3 = :o3
+      O3_2025_04_16 = :"o3-2025-04-16"
       O3_MINI = :"o3-mini"
       O3_MINI_2025_01_31 = :"o3-mini-2025-01-31"
       O1 = :o1
 
@@ -133,6 +133,8 @@ class CompletionCreateParams < OpenAI::Internal::Type::BaseModel
       optional :seed, Integer, nil?: true
 
       # @!attribute stop
+      #   Not supported with latest reasoning models `o3` and `o4-mini`.
+      #
       #   Up to 4 sequences where the API will stop generating further tokens. The
       #   returned text will not contain the stop sequence.
       #
@@ -288,6 +290,8 @@ module Prompt
         ArrayOfToken2DArray = OpenAI::Internal::Type::ArrayOf[OpenAI::Internal::Type::ArrayOf[Integer]]
       end
 
+      # Not supported with latest reasoning models `o3` and `o4-mini`.
+      #
       # Up to 4 sequences where the API will stop generating further tokens. The
       # returned text will not contain the stop sequence.
       module Stop
 
@@ -15,15 +15,23 @@ class Reasoning < OpenAI::Internal::Type::BaseModel
       optional :effort, enum: -> { OpenAI::Models::ReasoningEffort }, nil?: true
 
       # @!attribute generate_summary
-      #   **computer_use_preview only**
+      #   **Deprecated:** use `summary` instead.
       #
       #   A summary of the reasoning performed by the model. This can be useful for
-      #   debugging and understanding the model's reasoning process. One of `concise` or
-      #   `detailed`.
+      #   debugging and understanding the model's reasoning process. One of `auto`,
+      #   `concise`, or `detailed`.
       #
       #   @return [Symbol, OpenAI::Models::Reasoning::GenerateSummary, nil]
       optional :generate_summary, enum: -> { OpenAI::Models::Reasoning::GenerateSummary }, nil?: true
 
+      # @!attribute summary
+      #   A summary of the reasoning performed by the model. This can be useful for
+      #   debugging and understanding the model's reasoning process. One of `auto`,
+      #   `concise`, or `detailed`.
+      #
+      #   @return [Symbol, OpenAI::Models::Reasoning::Summary, nil]
+      optional :summary, enum: -> { OpenAI::Models::Reasoning::Summary }, nil?: true
+
       # @!parse
       #   # **o-series models only**
       #   #
@@ -32,21 +40,44 @@ class Reasoning < OpenAI::Internal::Type::BaseModel
       #   #
       #   # @param effort [Symbol, OpenAI::Models::ReasoningEffort, nil]
       #   # @param generate_summary [Symbol, OpenAI::Models::Reasoning::GenerateSummary, nil]
+      #   # @param summary [Symbol, OpenAI::Models::Reasoning::Summary, nil]
       #   #
-      #   def initialize(effort: nil, generate_summary: nil, **) = super
+      #   def initialize(effort: nil, generate_summary: nil, summary: nil, **) = super
 
       # def initialize: (Hash | OpenAI::Internal::Type::BaseModel) -> void
 
-      # **computer_use_preview only**
+      # @deprecated
+      #
+      # **Deprecated:** use `summary` instead.
       #
       # A summary of the reasoning performed by the model. This can be useful for
-      # debugging and understanding the model's reasoning process. One of `concise` or
-      # `detailed`.
+      # debugging and understanding the model's reasoning process. One of `auto`,
+      # `concise`, or `detailed`.
       #
       # @see OpenAI::Models::Reasoning#generate_summary
       module GenerateSummary
         extend OpenAI::Internal::Type::Enum
 
+        AUTO = :auto
+        CONCISE = :concise
+        DETAILED = :detailed
+
+        finalize!
+
+        # @!parse
+        #   # @return [Array<Symbol>]
+        #   def self.values; end
+      end
+
+      # A summary of the reasoning performed by the model. This can be useful for
+      # debugging and understanding the model's reasoning process. One of `auto`,
+      # `concise`, or `detailed`.
+      #
+      # @see OpenAI::Models::Reasoning#summary
+      module Summary
+        extend OpenAI::Internal::Type::Enum
+
+        AUTO = :auto
         CONCISE = :concise
         DETAILED = :detailed