RooCodeInc · daniel-lxs · Aug 13, 2025 · Aug 13, 2025 · Aug 14, 2025 · Aug 14, 2025
@@ -47,6 +47,8 @@ export const modelInfoSchema = z.object({
 	// Capability flag to indicate whether the model supports an output verbosity parameter
 	supportsVerbosity: z.boolean().optional(),
 	supportsReasoningBudget: z.boolean().optional(),
+	// Capability flag to indicate whether the model supports temperature parameter
+	supportsTemperature: z.boolean().optional(),
 	requiredReasoningBudget: z.boolean().optional(),
 	supportsReasoningEffort: z.boolean().optional(),
 	supportedParameters: z.array(modelParametersSchema).optional(),

@@ -19,6 +19,7 @@ export const openAiNativeModels = {
 		description: "GPT-5: The best model for coding and agentic tasks across domains",
 		// supportsVerbosity is a new capability; ensure ModelInfo includes it
 		supportsVerbosity: true,
+		supportsTemperature: false,
 	},
 	"gpt-5-mini-2025-08-07": {
 		maxTokens: 128000,
@@ -32,6 +33,7 @@ export const openAiNativeModels = {
 		cacheReadsPrice: 0.03,
 		description: "GPT-5 Mini: A faster, more cost-efficient version of GPT-5 for well-defined tasks",
 		supportsVerbosity: true,
+		supportsTemperature: false,
 	},
 	"gpt-5-nano-2025-08-07": {
 		maxTokens: 128000,
@@ -45,6 +47,7 @@ export const openAiNativeModels = {
 		cacheReadsPrice: 0.01,
 		description: "GPT-5 Nano: Fastest, most cost-efficient version of GPT-5",
 		supportsVerbosity: true,
+		supportsTemperature: false,
 	},
 	"gpt-4.1": {
 		maxTokens: 32_768,
@@ -54,6 +57,7 @@ export const openAiNativeModels = {
 		inputPrice: 2,
 		outputPrice: 8,
 		cacheReadsPrice: 0.5,
+		supportsTemperature: true,
 	},
 	"gpt-4.1-mini": {
 		maxTokens: 32_768,
@@ -63,6 +67,7 @@ export const openAiNativeModels = {
 		inputPrice: 0.4,
 		outputPrice: 1.6,
 		cacheReadsPrice: 0.1,
+		supportsTemperature: true,
 	},
 	"gpt-4.1-nano": {
 		maxTokens: 32_768,
@@ -72,6 +77,7 @@ export const openAiNativeModels = {
 		inputPrice: 0.1,
 		outputPrice: 0.4,
 		cacheReadsPrice: 0.025,
+		supportsTemperature: true,
 	},
 	o3: {
 		maxTokens: 100_000,
@@ -83,6 +89,7 @@ export const openAiNativeModels = {
 		cacheReadsPrice: 0.5,
 		supportsReasoningEffort: true,
 		reasoningEffort: "medium",
+		supportsTemperature: false,
 	},
 	"o3-high": {
 		maxTokens: 100_000,
@@ -93,6 +100,7 @@ export const openAiNativeModels = {
 		outputPrice: 8.0,
 		cacheReadsPrice: 0.5,
 		reasoningEffort: "high",
+		supportsTemperature: false,
 	},
 	"o3-low": {
 		maxTokens: 100_000,
@@ -103,6 +111,7 @@ export const openAiNativeModels = {
 		outputPrice: 8.0,
 		cacheReadsPrice: 0.5,
 		reasoningEffort: "low",
+		supportsTemperature: false,
 	},
 	"o4-mini": {
 		maxTokens: 100_000,
@@ -114,6 +123,7 @@ export const openAiNativeModels = {
 		cacheReadsPrice: 0.275,
 		supportsReasoningEffort: true,
 		reasoningEffort: "medium",
+		supportsTemperature: false,
 	},
 	"o4-mini-high": {
 		maxTokens: 100_000,
@@ -124,6 +134,7 @@ export const openAiNativeModels = {
 		outputPrice: 4.4,
 		cacheReadsPrice: 0.275,
 		reasoningEffort: "high",
+		supportsTemperature: false,
 	},
 	"o4-mini-low": {
 		maxTokens: 100_000,
@@ -134,6 +145,7 @@ export const openAiNativeModels = {
 		outputPrice: 4.4,
 		cacheReadsPrice: 0.275,
 		reasoningEffort: "low",
+		supportsTemperature: false,
 	},
 	"o3-mini": {
 		maxTokens: 100_000,
@@ -145,6 +157,7 @@ export const openAiNativeModels = {
 		cacheReadsPrice: 0.55,
 		supportsReasoningEffort: true,
 		reasoningEffort: "medium",
+		supportsTemperature: false,
 	},
 	"o3-mini-high": {
 		maxTokens: 100_000,
@@ -155,6 +168,7 @@ export const openAiNativeModels = {
 		outputPrice: 4.4,
 		cacheReadsPrice: 0.55,
 		reasoningEffort: "high",
+		supportsTemperature: false,
 	},
 	"o3-mini-low": {
 		maxTokens: 100_000,
@@ -165,6 +179,7 @@ export const openAiNativeModels = {
 		outputPrice: 4.4,
 		cacheReadsPrice: 0.55,
 		reasoningEffort: "low",
+		supportsTemperature: false,
 	},
 	o1: {
 		maxTokens: 100_000,
@@ -174,6 +189,7 @@ export const openAiNativeModels = {
 		inputPrice: 15,
 		outputPrice: 60,
 		cacheReadsPrice: 7.5,
+		supportsTemperature: false,
 	},
 	"o1-preview": {
 		maxTokens: 32_768,
@@ -183,6 +199,7 @@ export const openAiNativeModels = {
 		inputPrice: 15,
 		outputPrice: 60,
 		cacheReadsPrice: 7.5,
+		supportsTemperature: false,
 	},
 	"o1-mini": {
 		maxTokens: 65_536,
@@ -192,6 +209,7 @@ export const openAiNativeModels = {
 		inputPrice: 1.1,
 		outputPrice: 4.4,
 		cacheReadsPrice: 0.55,
+		supportsTemperature: false,
 	},
 	"gpt-4o": {
 		maxTokens: 16_384,
@@ -201,6 +219,7 @@ export const openAiNativeModels = {
 		inputPrice: 2.5,
 		outputPrice: 10,
 		cacheReadsPrice: 1.25,
+		supportsTemperature: true,
 	},
 	"gpt-4o-mini": {
 		maxTokens: 16_384,
@@ -210,6 +229,7 @@ export const openAiNativeModels = {
 		inputPrice: 0.15,
 		outputPrice: 0.6,
 		cacheReadsPrice: 0.075,
+		supportsTemperature: true,
 	},
 	"codex-mini-latest": {
 		maxTokens: 16_384,
@@ -219,6 +239,7 @@ export const openAiNativeModels = {
 		inputPrice: 1.5,
 		outputPrice: 6,
 		cacheReadsPrice: 0,
+		supportsTemperature: false,
 		description:
 			"Codex Mini: Cloud-based software engineering agent powered by codex-1, a version of o3 optimized for coding tasks. Trained with reinforcement learning to generate human-style code, adhere to instructions, and iteratively run tests.",
 	},

@@ -52,6 +52,14 @@ export interface ApiHandlerCreateMessageMetadata {
 	 * Used to enforce "skip once" after a condense operation.
 	 */
 	suppressPreviousResponseId?: boolean
+	/**
+	 * Controls whether the response should be stored for 30 days in OpenAI's Responses API.
+	 * When true (default), responses are stored and can be referenced in future requests
+	 * using the previous_response_id for efficient conversation continuity.
+	 * Set to false to opt out of response storage for privacy or compliance reasons.
+	 * @default true
+	 */
+	store?: boolean
 }
 
 export interface ApiHandler {