feat(api): Add tools and structured outputs to evals

stainless-app[bot] · stainless-app[bot] · commit 64844f1be2da · 2025-06-09T15:47:33.000Z
diff --git a/.stats.yml b/.stats.yml
@@ -1,4 +1,4 @@
 configured_endpoints: 111
-openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-0205acb1015d29b2312a48526734c0399f93026d4fe2dff5c7768f566e333fd2.yml
-openapi_spec_hash: 1772cc9056c2f6dfb2a4e9cb77ee6343
+openapi_spec_url: https://storage.googleapis.com/stainless-sdk-openapi-specs/openai%2Fopenai-4865dda2b62927bd141cbc85f81be3d88602f103e2c581e15eb1caded3e3aaa2.yml
+openapi_spec_hash: 7d14a9b23ef4ac93ea46d629601b6f6b
 config_hash: ed1e6b3c5f93d12b80d31167f55c557c
diff --git a/src/resources/evals/runs/runs.ts b/src/resources/evals/runs/runs.ts
@@ -3,6 +3,7 @@
 import { APIResource } from '../../../core/resource';
 import * as Shared from '../../shared';
 import * as ResponsesAPI from '../../responses/responses';
+import * as CompletionsAPI from '../../chat/completions/completions';
 import * as OutputItemsAPI from './output-items';
 import {
   OutputItemListParams,
@@ -257,6 +258,23 @@ export namespace CreateEvalCompletionsRunDataSource {
      */
     max_completion_tokens?: number;
 
+    /**
+     * An object specifying the format that the model must output.
+     *
+     * Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
+     * Outputs, which ensures the model will match your supplied JSON schema. Learn more
+     * in the
+     * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+     *
+     * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+     * ensures the message the model generates is valid JSON. Using `json_schema` is
+     * preferred for models that support it.
+     */
+    response_format?:
+      | Shared.ResponseFormatText
+      | Shared.ResponseFormatJSONSchema
+      | Shared.ResponseFormatJSONObject;
+
     /**
      * A seed value to initialize the randomness, during sampling.
      */
@@ -267,6 +285,13 @@ export namespace CreateEvalCompletionsRunDataSource {
      */
     temperature?: number;
 
+    /**
+     * A list of tools the model may call. Currently, only functions are supported as a
+     * tool. Use this to provide a list of functions the model may generate JSON inputs
+     * for. A maximum of 128 functions is supported.
+     */
+    tools?: Array<CompletionsAPI.ChatCompletionTool>;
+
     /**
      * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
      */
@@ -649,11 +674,66 @@ export namespace RunCreateResponse {
        */
       temperature?: number;
 
+      /**
+       * Configuration options for a text response from the model. Can be plain text or
+       * structured JSON data. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      text?: SamplingParams.Text;
+
+      /**
+       * An array of tools the model may call while generating a response. You can
+       * specify which tool to use by setting the `tool_choice` parameter.
+       *
+       * The two categories of tools you can provide the model are:
+       *
+       * - **Built-in tools**: Tools that are provided by OpenAI that extend the model's
+       *   capabilities, like
+       *   [web search](https://platform.openai.com/docs/guides/tools-web-search) or
+       *   [file search](https://platform.openai.com/docs/guides/tools-file-search).
+       *   Learn more about
+       *   [built-in tools](https://platform.openai.com/docs/guides/tools).
+       * - **Function calls (custom tools)**: Functions that are defined by you, enabling
+       *   the model to call your own code. Learn more about
+       *   [function calling](https://platform.openai.com/docs/guides/function-calling).
+       */
+      tools?: Array<ResponsesAPI.Tool>;
+
       /**
        * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
        */
       top_p?: number;
     }
+
+    export namespace SamplingParams {
+      /**
+       * Configuration options for a text response from the model. The response can be
+       * plain text or structured JSON data, as selected by `format`. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      export interface Text {
+        /**
+         * An object specifying the format that the model must output.
+         *
+         * Configuring `{ "type": "json_schema" }` enables Structured Outputs, which
+         * ensures the model's output matches your supplied JSON schema. Learn more in the
+         * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+         *
+         * The default format is `{ "type": "text" }` with no additional options.
+         *
+         * **Not recommended for gpt-4o and newer models:**
+         *
+         * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+         * ensures that the message the model generates is valid JSON. Prefer
+         * `json_schema` for models that support it.
+         */
+        format?: ResponsesAPI.ResponseFormatTextConfig;
+      }
+    }
   }
 
   export interface PerModelUsage {
@@ -1041,11 +1121,66 @@ export namespace RunRetrieveResponse {
        */
       temperature?: number;
 
+      /**
+       * Configuration options for a text response from the model. Can be plain text or
+       * structured JSON data. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      text?: SamplingParams.Text;
+
+      /**
+       * An array of tools the model may call while generating a response. You can
+       * specify which tool to use by setting the `tool_choice` parameter.
+       *
+       * The two categories of tools you can provide the model are:
+       *
+       * - **Built-in tools**: Tools that are provided by OpenAI that extend the model's
+       *   capabilities, like
+       *   [web search](https://platform.openai.com/docs/guides/tools-web-search) or
+       *   [file search](https://platform.openai.com/docs/guides/tools-file-search).
+       *   Learn more about
+       *   [built-in tools](https://platform.openai.com/docs/guides/tools).
+       * - **Function calls (custom tools)**: Functions that are defined by you, enabling
+       *   the model to call your own code. Learn more about
+       *   [function calling](https://platform.openai.com/docs/guides/function-calling).
+       */
+      tools?: Array<ResponsesAPI.Tool>;
+
       /**
        * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
        */
       top_p?: number;
     }
+
+    export namespace SamplingParams {
+      /**
+       * Configuration options for a text response from the model. The response can be
+       * plain text or structured JSON data, as selected by `format`. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      export interface Text {
+        /**
+         * An object specifying the format that the model must output.
+         *
+         * Configuring `{ "type": "json_schema" }` enables Structured Outputs, which
+         * ensures the model's output matches your supplied JSON schema. Learn more in the
+         * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+         *
+         * The default format is `{ "type": "text" }` with no additional options.
+         *
+         * **Not recommended for gpt-4o and newer models:**
+         *
+         * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+         * ensures that the message the model generates is valid JSON. Prefer
+         * `json_schema` for models that support it.
+         */
+        format?: ResponsesAPI.ResponseFormatTextConfig;
+      }
+    }
   }
 
   export interface PerModelUsage {
@@ -1430,11 +1565,66 @@ export namespace RunListResponse {
        */
       temperature?: number;
 
+      /**
+       * Configuration options for a text response from the model. Can be plain text or
+       * structured JSON data. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      text?: SamplingParams.Text;
+
+      /**
+       * An array of tools the model may call while generating a response. You can
+       * specify which tool to use by setting the `tool_choice` parameter.
+       *
+       * The two categories of tools you can provide the model are:
+       *
+       * - **Built-in tools**: Tools that are provided by OpenAI that extend the model's
+       *   capabilities, like
+       *   [web search](https://platform.openai.com/docs/guides/tools-web-search) or
+       *   [file search](https://platform.openai.com/docs/guides/tools-file-search).
+       *   Learn more about
+       *   [built-in tools](https://platform.openai.com/docs/guides/tools).
+       * - **Function calls (custom tools)**: Functions that are defined by you, enabling
+       *   the model to call your own code. Learn more about
+       *   [function calling](https://platform.openai.com/docs/guides/function-calling).
+       */
+      tools?: Array<ResponsesAPI.Tool>;
+
       /**
        * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
        */
       top_p?: number;
     }
+
+    export namespace SamplingParams {
+      /**
+       * Configuration options for a text response from the model. The response can be
+       * plain text or structured JSON data, as selected by `format`. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      export interface Text {
+        /**
+         * An object specifying the format that the model must output.
+         *
+         * Configuring `{ "type": "json_schema" }` enables Structured Outputs, which
+         * ensures the model's output matches your supplied JSON schema. Learn more in the
+         * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+         *
+         * The default format is `{ "type": "text" }` with no additional options.
+         *
+         * **Not recommended for gpt-4o and newer models:**
+         *
+         * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+         * ensures that the message the model generates is valid JSON. Prefer
+         * `json_schema` for models that support it.
+         */
+        format?: ResponsesAPI.ResponseFormatTextConfig;
+      }
+    }
   }
 
   export interface PerModelUsage {
@@ -1830,11 +2020,66 @@ export namespace RunCancelResponse {
        */
       temperature?: number;
 
+      /**
+       * Configuration options for a text response from the model. Can be plain text or
+       * structured JSON data. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      text?: SamplingParams.Text;
+
+      /**
+       * An array of tools the model may call while generating a response. You can
+       * specify which tool to use by setting the `tool_choice` parameter.
+       *
+       * The two categories of tools you can provide the model are:
+       *
+       * - **Built-in tools**: Tools that are provided by OpenAI that extend the model's
+       *   capabilities, like
+       *   [web search](https://platform.openai.com/docs/guides/tools-web-search) or
+       *   [file search](https://platform.openai.com/docs/guides/tools-file-search).
+       *   Learn more about
+       *   [built-in tools](https://platform.openai.com/docs/guides/tools).
+       * - **Function calls (custom tools)**: Functions that are defined by you, enabling
+       *   the model to call your own code. Learn more about
+       *   [function calling](https://platform.openai.com/docs/guides/function-calling).
+       */
+      tools?: Array<ResponsesAPI.Tool>;
+
       /**
        * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
        */
       top_p?: number;
     }
+
+    export namespace SamplingParams {
+      /**
+       * Configuration options for a text response from the model. The response can be
+       * plain text or structured JSON data, as selected by `format`. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      export interface Text {
+        /**
+         * An object specifying the format that the model must output.
+         *
+         * Configuring `{ "type": "json_schema" }` enables Structured Outputs, which
+         * ensures the model's output matches your supplied JSON schema. Learn more in the
+         * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+         *
+         * The default format is `{ "type": "text" }` with no additional options.
+         *
+         * **Not recommended for gpt-4o and newer models:**
+         *
+         * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+         * ensures that the message the model generates is valid JSON. Prefer
+         * `json_schema` for models that support it.
+         */
+        format?: ResponsesAPI.ResponseFormatTextConfig;
+      }
+    }
   }
 
   export interface PerModelUsage {
@@ -2169,11 +2414,66 @@ export namespace RunCreateParams {
        */
       temperature?: number;
 
+      /**
+       * Configuration options for a text response from the model. Can be plain text or
+       * structured JSON data. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      text?: SamplingParams.Text;
+
+      /**
+       * An array of tools the model may call while generating a response. You can
+       * specify which tool to use by setting the `tool_choice` parameter.
+       *
+       * The two categories of tools you can provide the model are:
+       *
+       * - **Built-in tools**: Tools that are provided by OpenAI that extend the model's
+       *   capabilities, like
+       *   [web search](https://platform.openai.com/docs/guides/tools-web-search) or
+       *   [file search](https://platform.openai.com/docs/guides/tools-file-search).
+       *   Learn more about
+       *   [built-in tools](https://platform.openai.com/docs/guides/tools).
+       * - **Function calls (custom tools)**: Functions that are defined by you, enabling
+       *   the model to call your own code. Learn more about
+       *   [function calling](https://platform.openai.com/docs/guides/function-calling).
+       */
+      tools?: Array<ResponsesAPI.Tool>;
+
       /**
        * An alternative to temperature for nucleus sampling; 1.0 includes all tokens.
        */
       top_p?: number;
     }
+
+    export namespace SamplingParams {
+      /**
+       * Configuration options for a text response from the model. The response can be
+       * plain text or structured JSON data, as selected by `format`. Learn more:
+       *
+       * - [Text inputs and outputs](https://platform.openai.com/docs/guides/text)
+       * - [Structured Outputs](https://platform.openai.com/docs/guides/structured-outputs)
+       */
+      export interface Text {
+        /**
+         * An object specifying the format that the model must output.
+         *
+         * Configuring `{ "type": "json_schema" }` enables Structured Outputs, which
+         * ensures the model's output matches your supplied JSON schema. Learn more in the
+         * [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).
+         *
+         * The default format is `{ "type": "text" }` with no additional options.
+         *
+         * **Not recommended for gpt-4o and newer models:**
+         *
+         * Setting to `{ "type": "json_object" }` enables the older JSON mode, which
+         * ensures that the message the model generates is valid JSON. Prefer
+         * `json_schema` for models that support it.
+         */
+        format?: ResponsesAPI.ResponseFormatTextConfig;
+      }
+    }
   }
 }