feat(api): responses x eval api

stainless-app[bot] · stainless-app[bot] · commit ea1d56c979ad · 2025-05-16T12:11:58.000-05:00
diff --git a/.stats.yml b/.stats.yml
@@ -1,4 +1,4 @@
 configured_endpoints: 101
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-794a6ed3c3d3d77887564755168056af8a426b17cf1ec721e3a300503dc22a41.yml
-openapi_spec_hash: 25a81c220713cd5b0bafc221d1dfa79a
-config_hash: 0b768ed1b56c6d82816f0fa40dc4aaf5
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-161ca7f1cfd7b33c1fc07d0ce25dfe4be5a7271c394f4cb526b7fb21b0729900.yml
+openapi_spec_hash: 602e14add4bee018c6774e320ce309b8
+config_hash: 7da27f7260075e8813ddcea542fba1bf
diff --git a/api.md b/api.md
@@ -709,6 +709,7 @@ Methods:
 Types:
 
 - <code><a href="./src/resources/evals/evals.ts">EvalCustomDataSourceConfig</a></code>
+- <code><a href="./src/resources/evals/evals.ts">EvalLogsDataSourceConfig</a></code>
 - <code><a href="./src/resources/evals/evals.ts">EvalStoredCompletionsDataSourceConfig</a></code>
 - <code><a href="./src/resources/evals/evals.ts">EvalCreateResponse</a></code>
 - <code><a href="./src/resources/evals/evals.ts">EvalRetrieveResponse</a></code>
@@ -730,6 +731,7 @@ Types:
 
 - <code><a href="./src/resources/evals/runs/runs.ts">CreateEvalCompletionsRunDataSource</a></code>
 - <code><a href="./src/resources/evals/runs/runs.ts">CreateEvalJSONLRunDataSource</a></code>
+- <code><a href="./src/resources/evals/runs/runs.ts">CreateEvalResponsesRunDataSource</a></code>
 - <code><a href="./src/resources/evals/runs/runs.ts">EvalAPIError</a></code>
 - <code><a href="./src/resources/evals/runs/runs.ts">RunCreateResponse</a></code>
 - <code><a href="./src/resources/evals/runs/runs.ts">RunRetrieveResponse</a></code>
diff --git a/src/index.ts b/src/index.ts
@@ -74,6 +74,7 @@ import {
   EvalListParams,
   EvalListResponse,
   EvalListResponsesPage,
+  EvalLogsDataSourceConfig,
   EvalRetrieveResponse,
   EvalStoredCompletionsDataSourceConfig,
   EvalUpdateParams,
@@ -533,6 +534,7 @@ export declare namespace OpenAI {
   export {
     Evals as Evals,
     type EvalCustomDataSourceConfig as EvalCustomDataSourceConfig,
+    type EvalLogsDataSourceConfig as EvalLogsDataSourceConfig,
     type EvalStoredCompletionsDataSourceConfig as EvalStoredCompletionsDataSourceConfig,
     type EvalCreateResponse as EvalCreateResponse,
     type EvalRetrieveResponse as EvalRetrieveResponse,
diff --git a/src/resources/audio/transcriptions.ts b/src/resources/audio/transcriptions.ts
@@ -324,6 +324,14 @@ export interface TranscriptionCreateParamsBase<
    */
   model: (string & {}) | AudioAPI.AudioModel;
 
+  /**
+   * Controls how the audio is cut into chunks. When set to `"auto"`, the server
+   * first normalizes loudness and then uses voice activity detection (VAD) to choose
+   * boundaries. A `server_vad` object can be provided to tweak VAD detection
+   * parameters manually. If unset, the audio is transcribed as a single block.
+   */
+  chunking_strategy?: 'auto' | TranscriptionCreateParams.VadConfig | null;
+
   /**
    * Additional information to include in the transcription response. `logprobs` will
    * return the log probabilities of the tokens in the response to understand the
@@ -387,6 +395,32 @@ export interface TranscriptionCreateParamsBase<
 }
 
 export namespace TranscriptionCreateParams {
+  export interface VadConfig {
+    /**
+     * Must be set to `server_vad` to enable manual chunking using server side VAD.
+     */
+    type: 'server_vad';
+
+    /**
+     * Amount of audio to include before the VAD detected speech (in milliseconds).
+     */
+    prefix_padding_ms?: number;
+
+    /**
+     * Duration of silence to detect speech stop (in milliseconds). With shorter values
+     * the model will respond more quickly, but may jump in on short pauses from the
+     * user.
+     */
+    silence_duration_ms?: number;
+
+    /**
+     * Sensitivity threshold (0.0 to 1.0) for voice activity detection. A higher
+     * threshold will require louder audio to activate the model, and thus might
+     * perform better in noisy environments.
+     */
+    threshold?: number;
+  }
+
   export type TranscriptionCreateParamsNonStreaming = TranscriptionsAPI.TranscriptionCreateParamsNonStreaming;
   export type TranscriptionCreateParamsStreaming = TranscriptionsAPI.TranscriptionCreateParamsStreaming;
 }
diff --git a/src/resources/embeddings.ts b/src/resources/embeddings.ts
@@ -130,11 +130,12 @@ export interface EmbeddingCreateParams {
    * Input text to embed, encoded as a string or array of tokens. To embed multiple
    * inputs in a single request, pass an array of strings or array of token arrays.
    * The input must not exceed the max input tokens for the model (8192 tokens for
-   * `text-embedding-ada-002`), cannot be an empty string, and any array must be 2048
+   * all embedding models), cannot be an empty string, and any array must be 2048
    * dimensions or less.
    * [Example Python code](https://cookbook.openai.com/examples/how_to_count_tokens_with_tiktoken)
-   * for counting tokens. Some models may also impose a limit on total number of
-   * tokens summed across inputs.
+   * for counting tokens. In addition to the per-input token limit, all embedding
+   * models enforce a maximum of 300,000 tokens summed across all inputs in a single
+   * request.
    */
   input: string | Array<string> | Array<number> | Array<Array<number>>;
 
diff --git a/src/resources/evals/evals.ts b/src/resources/evals/evals.ts
@@ -10,6 +10,7 @@ import * as RunsAPI from './runs/runs';
 import {
   CreateEvalCompletionsRunDataSource,
   CreateEvalJSONLRunDataSource,
+  CreateEvalResponsesRunDataSource,
   EvalAPIError,
   RunCancelResponse,
   RunCreateParams,
@@ -105,11 +106,37 @@ export interface EvalCustomDataSourceConfig {
 }
 
 /**
- * A StoredCompletionsDataSourceConfig which specifies the metadata property of
- * your stored completions query. This is usually metadata like `usecase=chatbot`
- * or `prompt-version=v2`, etc. The schema returned by this data source config is
- * used to defined what variables are available in your evals. `item` and `sample`
- * are both defined when using this data source config.
+ * A LogsDataSourceConfig which specifies the metadata property of your logs query.
+ * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc. The
+ * schema returned by this data source config is used to define what variables are
+ * available in your evals. `item` and `sample` are both defined when using this
+ * data source config.
+ */
+export interface EvalLogsDataSourceConfig {
+  /**
+   * The json schema for the run data source items. Learn how to build JSON schemas
+   * [here](https://json-schema.org/).
+   */
+  schema: Record<string, unknown>;
+
+  /**
+   * The type of data source. Always `logs`.
+   */
+  type: 'logs';
+
+  /**
+   * Set of 16 key-value pairs that can be attached to an object. This can be useful
+   * for storing additional information about the object in a structured format, and
+   * querying for objects via API or the dashboard.
+   *
+   * Keys are strings with a maximum length of 64 characters. Values are strings with
+   * a maximum length of 512 characters.
+   */
+  metadata?: Shared.Metadata | null;
+}
+
+/**
+ * @deprecated Deprecated in favor of LogsDataSourceConfig.
  */
 export interface EvalStoredCompletionsDataSourceConfig {
   /**
@@ -119,9 +146,9 @@ export interface EvalStoredCompletionsDataSourceConfig {
   schema: Record<string, unknown>;
 
   /**
-   * The type of data source. Always `stored_completions`.
+   * The type of data source. Always `stored-completions`.
    */
-  type: 'stored_completions';
+  type: 'stored-completions';
 
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -156,7 +183,10 @@ export interface EvalCreateResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalLogsDataSourceConfig
+    | EvalStoredCompletionsDataSourceConfig;
 
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -244,7 +274,10 @@ export interface EvalRetrieveResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalLogsDataSourceConfig
+    | EvalStoredCompletionsDataSourceConfig;
 
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -332,7 +365,10 @@ export interface EvalUpdateResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalLogsDataSourceConfig
+    | EvalStoredCompletionsDataSourceConfig;
 
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -420,7 +456,10 @@ export interface EvalListResponse {
   /**
    * Configuration of data sources used in runs of the evaluation.
    */
-  data_source_config: EvalCustomDataSourceConfig | EvalStoredCompletionsDataSourceConfig;
+  data_source_config:
+    | EvalCustomDataSourceConfig
+    | EvalLogsDataSourceConfig
+    | EvalStoredCompletionsDataSourceConfig;
 
   /**
    * Set of 16 key-value pairs that can be attached to an object. This can be useful
@@ -498,7 +537,7 @@ export interface EvalCreateParams {
   /**
    * The configuration for the data source used for the evaluation runs.
    */
-  data_source_config: EvalCreateParams.Custom | EvalCreateParams.StoredCompletions;
+  data_source_config: EvalCreateParams.Custom | EvalCreateParams.Logs | EvalCreateParams.StoredCompletions;
 
   /**
    * A list of graders for all eval runs in this group.
@@ -555,15 +594,29 @@ export namespace EvalCreateParams {
   }
 
   /**
-   * A data source config which specifies the metadata property of your stored
-   * completions query. This is usually metadata like `usecase=chatbot` or
-   * `prompt-version=v2`, etc.
+   * A data source config which specifies the metadata property of your logs query.
+   * This is usually metadata like `usecase=chatbot` or `prompt-version=v2`, etc.
+   */
+  export interface Logs {
+    /**
+     * The type of data source. Always `logs`.
+     */
+    type: 'logs';
+
+    /**
+     * Metadata filters for the logs data source.
+     */
+    metadata?: Record<string, unknown>;
+  }
+
+  /**
+   * Deprecated in favor of LogsDataSourceConfig.
    */
   export interface StoredCompletions {
     /**
-     * The type of data source. Always `stored_completions`.
+     * The type of data source. Always `stored-completions`.
      */
-    type: 'stored_completions';
+    type: 'stored-completions';
 
     /**
      * Metadata filters for the stored completions data source.
@@ -733,6 +786,7 @@ Evals.RunListResponsesPage = RunListResponsesPage;
 export declare namespace Evals {
   export {
     type EvalCustomDataSourceConfig as EvalCustomDataSourceConfig,
+    type EvalLogsDataSourceConfig as EvalLogsDataSourceConfig,
     type EvalStoredCompletionsDataSourceConfig as EvalStoredCompletionsDataSourceConfig,
     type EvalCreateResponse as EvalCreateResponse,
     type EvalRetrieveResponse as EvalRetrieveResponse,
@@ -749,6 +803,7 @@ export declare namespace Evals {
     Runs as Runs,
     type CreateEvalCompletionsRunDataSource as CreateEvalCompletionsRunDataSource,
     type CreateEvalJSONLRunDataSource as CreateEvalJSONLRunDataSource,
+    type CreateEvalResponsesRunDataSource as CreateEvalResponsesRunDataSource,
     type EvalAPIError as EvalAPIError,
     type RunCreateResponse as RunCreateResponse,
     type RunRetrieveResponse as RunRetrieveResponse,
diff --git a/src/resources/evals/index.ts b/src/resources/evals/index.ts
@@ -4,6 +4,7 @@ export {
   EvalListResponsesPage,
   Evals,
   type EvalCustomDataSourceConfig,
+  type EvalLogsDataSourceConfig,
   type EvalStoredCompletionsDataSourceConfig,
   type EvalCreateResponse,
   type EvalRetrieveResponse,
@@ -19,6 +20,7 @@ export {
   Runs,
   type CreateEvalCompletionsRunDataSource,
   type CreateEvalJSONLRunDataSource,
+  type CreateEvalResponsesRunDataSource,
   type EvalAPIError,
   type RunCreateResponse,
   type RunRetrieveResponse,
diff --git a/src/resources/evals/runs/index.ts b/src/resources/evals/runs/index.ts
@@ -12,6 +12,7 @@ export {
   Runs,
   type CreateEvalCompletionsRunDataSource,
   type CreateEvalJSONLRunDataSource,
+  type CreateEvalResponsesRunDataSource,
   type EvalAPIError,
   type RunCreateResponse,
   type RunRetrieveResponse,
diff --git a/src/resources/evals/runs/runs.ts b/src/resources/evals/runs/runs.ts
diff --git a/src/resources/fine-tuning/jobs/jobs.ts b/src/resources/fine-tuning/jobs/jobs.ts
diff --git a/src/resources/index.ts b/src/resources/index.ts
diff --git a/tests/api-resources/audio/transcriptions.test.ts b/tests/api-resources/audio/transcriptions.test.ts