From dacbd6cb78ce2097e5080dbc26502bbb4419286a Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Thu, 10 Apr 2025 20:10:30 -0700
Subject: [PATCH 1/8] Specify reasoning effort for OpenRouter reasoning models

---
 src/api/index.ts                              |  6 ++-
 src/api/providers/openrouter.ts               | 15 +++++--
 src/exports/roo-code.d.ts                     |  3 +-
 src/exports/types.ts                          |  3 +-
 src/schemas/index.ts                          |  6 ++-
 .../src/components/settings/ApiOptions.tsx    |  9 +++-
 .../components/settings/ReasoningEffort.tsx   | 45 +++++++++++++++++++
 .../src/components/settings/constants.ts      |  2 +
 8 files changed, 80 insertions(+), 9 deletions(-)
 create mode 100644 webview-ui/src/components/settings/ReasoningEffort.tsx
diff --git a/src/api/index.ts b/src/api/index.ts
index 0880f42218..c6d2b07cd2 100644
--- a/src/api/index.ts
+++ b/src/api/index.ts
@@ -88,21 +88,25 @@ export function getModelParams({
 	model,
 	defaultMaxTokens,
 	defaultTemperature = 0,
+	defaultReasoningEffort,
 }: {
 	options: ApiHandlerOptions
 	model: ModelInfo
 	defaultMaxTokens?: number
 	defaultTemperature?: number
+	defaultReasoningEffort?: "low" | "medium" | "high"
 }) {
 	const {
 		modelMaxTokens: customMaxTokens,
 		modelMaxThinkingTokens: customMaxThinkingTokens,
 		modelTemperature: customTemperature,
+		reasoningEffort: customReasoningEffort,
 	} = options
 
 	let maxTokens = model.maxTokens ?? defaultMaxTokens
 	let thinking: BetaThinkingConfigParam | undefined = undefined
 	let temperature = customTemperature ?? defaultTemperature
+	const reasoningEffort = customReasoningEffort ?? defaultReasoningEffort
 
 	if (model.thinking) {
 		// Only honor `customMaxTokens` for thinking models.
@@ -118,5 +122,5 @@ export function getModelParams({
 		temperature = 1.0
 	}
 
-	return { maxTokens, thinking, temperature }
+	return { maxTokens, thinking, temperature, reasoningEffort }
 }
diff --git a/src/api/providers/openrouter.ts b/src/api/providers/openrouter.ts
index 72e4fe576a..2a279d09a1 100644
--- a/src/api/providers/openrouter.ts
+++ b/src/api/providers/openrouter.ts
@@ -1,8 +1,7 @@
 import { Anthropic } from "@anthropic-ai/sdk"
 import { BetaThinkingConfigParam } from "@anthropic-ai/sdk/resources/beta"
-import axios, { AxiosRequestConfig } from "axios"
+import axios from "axios"
 import OpenAI from "openai"
-import delay from "delay"
 
 import { ApiHandlerOptions, ModelInfo, openRouterDefaultModelId, openRouterDefaultModelInfo } from "../../shared/api"
 import { parseApiPrice } from "../../utils/cost"
@@ -22,6 +21,12 @@ type OpenRouterChatCompletionParams = OpenAI.Chat.ChatCompletionCreateParams & {
 	transforms?: string[]
 	include_reasoning?: boolean
 	thinking?: BetaThinkingConfigParam
+	// https://openrouter.ai/docs/use-cases/reasoning-tokens
+	reasoning?: {
+		effort?: "high" | "medium" | "low"
+		max_tokens?: number
+		exclude?: boolean
+	}
 }
 
 export class OpenRouterHandler extends BaseProvider implements SingleCompletionHandler {
@@ -42,7 +47,7 @@ export class OpenRouterHandler extends BaseProvider implements SingleCompletionH
 		systemPrompt: string,
 		messages: Anthropic.Messages.MessageParam[],
 	): AsyncGenerator<ApiStreamChunk> {
-		let { id: modelId, maxTokens, thinking, temperature, topP } = this.getModel()
+		let { id: modelId, maxTokens, thinking, temperature, topP, reasoningEffort } = this.getModel()
 
 		// Convert Anthropic messages to OpenAI format.
 		let openAiMessages: OpenAI.Chat.ChatCompletionMessageParam[] = [
@@ -70,13 +75,16 @@ export class OpenRouterHandler extends BaseProvider implements SingleCompletionH
 						},
 					],
 				}
+
 				// Add cache_control to the last two user messages
 				// (note: this works because we only ever add one user message at a time, but if we added multiple we'd need to mark the user message before the last assistant message)
 				const lastTwoUserMessages = openAiMessages.filter((msg) => msg.role === "user").slice(-2)
+
 				lastTwoUserMessages.forEach((msg) => {
 					if (typeof msg.content === "string") {
 						msg.content = [{ type: "text", text: msg.content }]
 					}
+
 					if (Array.isArray(msg.content)) {
 						// NOTE: this is fine since env details will always be added at the end. but if it weren't there, and the user added a image_url type message, it would pop a text part before it and then move it after to the end.
 						let lastTextPart = msg.content.filter((part) => part.type === "text").pop()
@@ -113,6 +121,7 @@ export class OpenRouterHandler extends BaseProvider implements SingleCompletionH
 				}),
 			// This way, the transforms field will only be included in the parameters when openRouterUseMiddleOutTransform is true.
 			...((this.options.openRouterUseMiddleOutTransform ?? true) && { transforms: ["middle-out"] }),
+			...(reasoningEffort && { reasoning: { effort: reasoningEffort } }),
 		}
 
 		const stream = await this.client.chat.completions.create(completionParams)
diff --git a/src/exports/roo-code.d.ts b/src/exports/roo-code.d.ts
index 40939e4e32..95117083d8 100644
--- a/src/exports/roo-code.d.ts
+++ b/src/exports/roo-code.d.ts
@@ -175,10 +175,11 @@ type ProviderSettings = {
 				cachableFields?: string[] | undefined
 		  } | null)
 		| undefined
-	modelTemperature?: (number | null) | undefined
 	modelMaxTokens?: number | undefined
 	modelMaxThinkingTokens?: number | undefined
 	includeMaxTokens?: boolean | undefined
+	modelTemperature?: (number | null) | undefined
+	reasoningEffort?: ("low" | "medium" | "high") | undefined
 	rateLimitSeconds?: number | undefined
 	fakeAi?: unknown | undefined
 }
diff --git a/src/exports/types.ts b/src/exports/types.ts
index 64a955554e..413172141c 100644
--- a/src/exports/types.ts
+++ b/src/exports/types.ts
@@ -176,10 +176,11 @@ type ProviderSettings = {
 				cachableFields?: string[] | undefined
 		  } | null)
 		| undefined
-	modelTemperature?: (number | null) | undefined
 	modelMaxTokens?: number | undefined
 	modelMaxThinkingTokens?: number | undefined
 	includeMaxTokens?: boolean | undefined
+	modelTemperature?: (number | null) | undefined
+	reasoningEffort?: ("low" | "medium" | "high") | undefined
 	rateLimitSeconds?: number | undefined
 	fakeAi?: unknown | undefined
 }
diff --git a/src/schemas/index.ts b/src/schemas/index.ts
index d2471882ec..47174c90b7 100644
--- a/src/schemas/index.ts
+++ b/src/schemas/index.ts
@@ -383,11 +383,12 @@ export const providerSettingsSchema = z.object({
 	requestyModelId: z.string().optional(),
 	requestyModelInfo: modelInfoSchema.nullish(),
 	// Claude 3.7 Sonnet Thinking
-	modelTemperature: z.number().nullish(),
 	modelMaxTokens: z.number().optional(),
 	modelMaxThinkingTokens: z.number().optional(),
 	// Generic
 	includeMaxTokens: z.boolean().optional(),
+	modelTemperature: z.number().nullish(),
+	reasoningEffort: z.enum(["low", "medium", "high"]).optional(),
 	rateLimitSeconds: z.number().optional(),
 	// Fake AI
 	fakeAi: z.unknown().optional(),
@@ -470,11 +471,12 @@ const providerSettingsRecord: ProviderSettingsRecord = {
 	requestyModelId: undefined,
 	requestyModelInfo: undefined,
 	// Claude 3.7 Sonnet Thinking
-	modelTemperature: undefined,
 	modelMaxTokens: undefined,
 	modelMaxThinkingTokens: undefined,
 	// Generic
 	includeMaxTokens: undefined,
+	modelTemperature: undefined,
+	reasoningEffort: undefined,
 	rateLimitSeconds: undefined,
 	// Fake AI
 	fakeAi: undefined,
diff --git a/webview-ui/src/components/settings/ApiOptions.tsx b/webview-ui/src/components/settings/ApiOptions.tsx
index 55690d4806..1d76148c10 100644
--- a/webview-ui/src/components/settings/ApiOptions.tsx
+++ b/webview-ui/src/components/settings/ApiOptions.tsx
@@ -46,7 +46,7 @@ import {
 	OPENROUTER_DEFAULT_PROVIDER_NAME,
 } from "@/components/ui/hooks/useOpenRouterModelProviders"
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator, Button } from "@/components/ui"
-import { MODELS_BY_PROVIDER, PROVIDERS, VERTEX_REGIONS } from "./constants"
+import { MODELS_BY_PROVIDER, PROVIDERS, VERTEX_REGIONS, REASONING_MODELS } from "./constants"
 import { AWS_REGIONS } from "../../../../src/shared/aws_regions"
 import { VSCodeButtonLink } from "../common/VSCodeButtonLink"
 import { ModelInfoView } from "./ModelInfoView"
@@ -58,6 +58,7 @@ import { ThinkingBudget } from "./ThinkingBudget"
 import { R1FormatSetting } from "./R1FormatSetting"
 import { OpenRouterBalanceDisplay } from "./OpenRouterBalanceDisplay"
 import { RequestyBalanceDisplay } from "./RequestyBalanceDisplay"
+import { ReasoningEffort } from "./ReasoningEffort"
 
 interface ApiOptionsProps {
 	uriScheme: string | undefined
@@ -1519,6 +1520,10 @@ const ApiOptions = ({
 					</div>
 				)}
 
+			{selectedProvider === "openrouter" && REASONING_MODELS.has(selectedModelId) && (
+				<ReasoningEffort setApiConfigurationField={setApiConfigurationField} modelInfo={selectedModelInfo} />
+			)}
+
 			{selectedProvider === "glama" && (
 				<ModelPicker
 					apiConfiguration={apiConfiguration}
@@ -1646,12 +1651,14 @@ const ApiOptions = ({
 								})()}
 						</>
 					)}
+
 					<ModelInfoView
 						selectedModelId={selectedModelId}
 						modelInfo={selectedModelInfo}
 						isDescriptionExpanded={isDescriptionExpanded}
 						setIsDescriptionExpanded={setIsDescriptionExpanded}
 					/>
+
 					<ThinkingBudget
 						key={`${selectedProvider}-${selectedModelId}`}
 						apiConfiguration={apiConfiguration}
diff --git a/webview-ui/src/components/settings/ReasoningEffort.tsx b/webview-ui/src/components/settings/ReasoningEffort.tsx
new file mode 100644
index 0000000000..efe8c427b6
--- /dev/null
+++ b/webview-ui/src/components/settings/ReasoningEffort.tsx
@@ -0,0 +1,45 @@
+import { useAppTranslation } from "@/i18n/TranslationContext"
+
+import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator } from "@/components/ui"
+
+import { ApiConfiguration, ModelInfo } from "../../../../src/shared/api"
+
+export const EFFORTS = ["high", "medium", "low"] as const
+
+interface ReasoningEffortProps {
+	setApiConfigurationField: <K extends keyof ApiConfiguration>(field: K, value: ApiConfiguration[K]) => void
+	modelInfo: ModelInfo
+}
+
+export const ReasoningEffort = ({ setApiConfigurationField, modelInfo }: ReasoningEffortProps) => {
+	const { t } = useAppTranslation()
+
+	return (
+		<div className="flex flex-col gap-1">
+			<div className="flex justify-between items-center">
+				<label className="block font-medium mb-1">Model Reasoning Effort</label>
+			</div>
+			<Select
+				value={modelInfo.reasoningEffort}
+				onValueChange={(value) =>
+					setApiConfigurationField("openRouterModelInfo", {
+						...modelInfo,
+						reasoningEffort: value as "high" | "medium" | "low",
+					})
+				}>
+				<SelectTrigger className="w-full">
+					<SelectValue placeholder={t("settings:common.select")} />
+				</SelectTrigger>
+				<SelectContent>
+					<SelectItem value="openrouter">OpenRouter</SelectItem>
+					<SelectSeparator />
+					{EFFORTS.map((value) => (
+						<SelectItem key={value} value={value}>
+							{value}
+						</SelectItem>
+					))}
+				</SelectContent>
+			</Select>
+		</div>
+	)
+}
diff --git a/webview-ui/src/components/settings/constants.ts b/webview-ui/src/components/settings/constants.ts
index 01f24a2ed5..772fe04b5f 100644
--- a/webview-ui/src/components/settings/constants.ts
+++ b/webview-ui/src/components/settings/constants.ts
@@ -46,3 +46,5 @@ export const VERTEX_REGIONS = [
 	{ value: "europe-west4", label: "europe-west4" },
 	{ value: "asia-southeast1", label: "asia-southeast1" },
 ]
+
+export const REASONING_MODELS = new Set(["x-ai/grok-3-mini-beta"])

From e588b3f059ba460ffe3766d3b484afea2047c0a8 Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Thu, 10 Apr 2025 20:13:49 -0700
Subject: [PATCH 2/8] Add ReasoningEffort type

---
 src/schemas/index.ts                               | 14 ++++++++++++--
 .../src/components/settings/ReasoningEffort.tsx    | 10 +++-------
 2 files changed, 15 insertions(+), 9 deletions(-)

diff --git a/src/schemas/index.ts b/src/schemas/index.ts
index 47174c90b7..013f09ac07 100644
--- a/src/schemas/index.ts
+++ b/src/schemas/index.ts
@@ -95,6 +95,16 @@ export const telemetrySettingsSchema = z.enum(telemetrySettings)
 
 export type TelemetrySetting = z.infer<typeof telemetrySettingsSchema>
 
+/**
+ * ReasoningEffort
+ */
+
+export const reasoningEfforts = ["low", "medium", "high"] as const
+
+export const reasoningEffortsSchema = z.enum(reasoningEfforts)
+
+export type ReasoningEffort = z.infer<typeof reasoningEffortsSchema>
+
 /**
  * ModelInfo
  */
@@ -110,7 +120,7 @@ export const modelInfoSchema = z.object({
 	cacheWritesPrice: z.number().optional(),
 	cacheReadsPrice: z.number().optional(),
 	description: z.string().optional(),
-	reasoningEffort: z.enum(["low", "medium", "high"]).optional(),
+	reasoningEffort: reasoningEffortsSchema.optional(),
 	thinking: z.boolean().optional(),
 	minTokensPerCachePoint: z.number().optional(),
 	maxCachePoints: z.number().optional(),
@@ -388,7 +398,7 @@ export const providerSettingsSchema = z.object({
 	// Generic
 	includeMaxTokens: z.boolean().optional(),
 	modelTemperature: z.number().nullish(),
-	reasoningEffort: z.enum(["low", "medium", "high"]).optional(),
+	reasoningEffort: reasoningEffortsSchema.optional(),
 	rateLimitSeconds: z.number().optional(),
 	// Fake AI
 	fakeAi: z.unknown().optional(),
diff --git a/webview-ui/src/components/settings/ReasoningEffort.tsx b/webview-ui/src/components/settings/ReasoningEffort.tsx
index efe8c427b6..5b5b877c3a 100644
--- a/webview-ui/src/components/settings/ReasoningEffort.tsx
+++ b/webview-ui/src/components/settings/ReasoningEffort.tsx
@@ -3,8 +3,7 @@ import { useAppTranslation } from "@/i18n/TranslationContext"
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator } from "@/components/ui"
 
 import { ApiConfiguration, ModelInfo } from "../../../../src/shared/api"
-
-export const EFFORTS = ["high", "medium", "low"] as const
+import { reasoningEfforts } from "../../../../src/schemas"
 
 interface ReasoningEffortProps {
 	setApiConfigurationField: <K extends keyof ApiConfiguration>(field: K, value: ApiConfiguration[K]) => void
@@ -22,10 +21,7 @@ export const ReasoningEffort = ({ setApiConfigurationField, modelInfo }: Reasoni
 			<Select
 				value={modelInfo.reasoningEffort}
 				onValueChange={(value) =>
-					setApiConfigurationField("openRouterModelInfo", {
-						...modelInfo,
-						reasoningEffort: value as "high" | "medium" | "low",
-					})
+					setApiConfigurationField("reasoningEffort", value as "high" | "medium" | "low")
 				}>
 				<SelectTrigger className="w-full">
 					<SelectValue placeholder={t("settings:common.select")} />
@@ -33,7 +29,7 @@ export const ReasoningEffort = ({ setApiConfigurationField, modelInfo }: Reasoni
 				<SelectContent>
 					<SelectItem value="openrouter">OpenRouter</SelectItem>
 					<SelectSeparator />
-					{EFFORTS.map((value) => (
+					{reasoningEfforts.map((value) => (
 						<SelectItem key={value} value={value}>
 							{value}
 						</SelectItem>

From 7659be07ba547116c61ced7eb2138ebfd10a6696 Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Thu, 10 Apr 2025 20:17:08 -0700
Subject: [PATCH 3/8] Fix ReasoningEffort props

---
 webview-ui/src/components/settings/ApiOptions.tsx      | 5 ++++-
 webview-ui/src/components/settings/ReasoningEffort.tsx | 8 ++++----
 2 files changed, 8 insertions(+), 5 deletions(-)

diff --git a/webview-ui/src/components/settings/ApiOptions.tsx b/webview-ui/src/components/settings/ApiOptions.tsx
index 1d76148c10..c0e116cabb 100644
--- a/webview-ui/src/components/settings/ApiOptions.tsx
+++ b/webview-ui/src/components/settings/ApiOptions.tsx
@@ -1521,7 +1521,10 @@ const ApiOptions = ({
 				)}
 
 			{selectedProvider === "openrouter" && REASONING_MODELS.has(selectedModelId) && (
-				<ReasoningEffort setApiConfigurationField={setApiConfigurationField} modelInfo={selectedModelInfo} />
+				<ReasoningEffort
+					apiConfiguration={apiConfiguration}
+					setApiConfigurationField={setApiConfigurationField}
+				/>
 			)}
 
 			{selectedProvider === "glama" && (
diff --git a/webview-ui/src/components/settings/ReasoningEffort.tsx b/webview-ui/src/components/settings/ReasoningEffort.tsx
index 5b5b877c3a..5ffb6682be 100644
--- a/webview-ui/src/components/settings/ReasoningEffort.tsx
+++ b/webview-ui/src/components/settings/ReasoningEffort.tsx
@@ -2,15 +2,15 @@ import { useAppTranslation } from "@/i18n/TranslationContext"
 
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator } from "@/components/ui"
 
-import { ApiConfiguration, ModelInfo } from "../../../../src/shared/api"
+import { ApiConfiguration } from "../../../../src/shared/api"
 import { reasoningEfforts } from "../../../../src/schemas"
 
 interface ReasoningEffortProps {
+	apiConfiguration: ApiConfiguration
 	setApiConfigurationField: <K extends keyof ApiConfiguration>(field: K, value: ApiConfiguration[K]) => void
-	modelInfo: ModelInfo
 }
 
-export const ReasoningEffort = ({ setApiConfigurationField, modelInfo }: ReasoningEffortProps) => {
+export const ReasoningEffort = ({ apiConfiguration, setApiConfigurationField }: ReasoningEffortProps) => {
 	const { t } = useAppTranslation()
 
 	return (
@@ -19,7 +19,7 @@ export const ReasoningEffort = ({ setApiConfigurationField, modelInfo }: Reasoni
 				<label className="block font-medium mb-1">Model Reasoning Effort</label>
 			</div>
 			<Select
-				value={modelInfo.reasoningEffort}
+				value={apiConfiguration.reasoningEffort}
 				onValueChange={(value) =>
 					setApiConfigurationField("reasoningEffort", value as "high" | "medium" | "low")
 				}>

From 6a69d48119414a4d8814065fd91511065df01605 Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Thu, 10 Apr 2025 20:20:59 -0700
Subject: [PATCH 4/8] Remove copy-pasted OpenRouter option from ReasoningEffort select

---
 webview-ui/src/components/settings/ReasoningEffort.tsx | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/webview-ui/src/components/settings/ReasoningEffort.tsx b/webview-ui/src/components/settings/ReasoningEffort.tsx
index 5ffb6682be..00ec57cc89 100644
--- a/webview-ui/src/components/settings/ReasoningEffort.tsx
+++ b/webview-ui/src/components/settings/ReasoningEffort.tsx
@@ -1,6 +1,6 @@
 import { useAppTranslation } from "@/i18n/TranslationContext"
 
-import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator } from "@/components/ui"
+import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui"
 
 import { ApiConfiguration } from "../../../../src/shared/api"
 import { reasoningEfforts } from "../../../../src/schemas"
@@ -27,8 +27,6 @@ export const ReasoningEffort = ({ apiConfiguration, setApiConfigurationField }:
 					<SelectValue placeholder={t("settings:common.select")} />
 				</SelectTrigger>
 				<SelectContent>
-					<SelectItem value="openrouter">OpenRouter</SelectItem>
-					<SelectSeparator />
 					{reasoningEfforts.map((value) => (
 						<SelectItem key={value} value={value}>
 							{value}

From c091ba11b486fcda8e1497978318939d04ce8ccf Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Thu, 10 Apr 2025 21:58:58 -0700
Subject: [PATCH 5/8] Use high reasoning effort for Grok 3 Mini; sync evals types

---
 evals/packages/types/src/roo-code-defaults.ts | 13 ++++++++-----
 evals/packages/types/src/roo-code.ts          | 13 +++++++++----
 src/api/providers/openai.ts                   | 17 ++++++++++++++++-
 3 files changed, 33 insertions(+), 10 deletions(-)

diff --git a/evals/packages/types/src/roo-code-defaults.ts b/evals/packages/types/src/roo-code-defaults.ts
index 8def51f085..f126f33ff0 100644
--- a/evals/packages/types/src/roo-code-defaults.ts
+++ b/evals/packages/types/src/roo-code-defaults.ts
@@ -20,18 +20,21 @@ export const rooCodeDefaults: RooCodeSettings = {
 	// 	thinking: false,
 	// },
 
+	modelTemperature: null,
+	// reasoningEffort: "high",
+
 	pinnedApiConfigs: {},
-	lastShownAnnouncementId: "mar-20-2025-3-10",
+	lastShownAnnouncementId: "apr-04-2025-boomerang",
 
 	autoApprovalEnabled: true,
 	alwaysAllowReadOnly: true,
 	alwaysAllowReadOnlyOutsideWorkspace: false,
 	alwaysAllowWrite: true,
 	alwaysAllowWriteOutsideWorkspace: false,
-	writeDelayMs: 200,
+	writeDelayMs: 1000,
 	alwaysAllowBrowser: true,
 	alwaysApproveResubmit: true,
-	requestDelaySeconds: 5,
+	requestDelaySeconds: 10,
 	alwaysAllowMcp: true,
 	alwaysAllowModeSwitch: true,
 	alwaysAllowSubtasks: true,
@@ -40,8 +43,8 @@ export const rooCodeDefaults: RooCodeSettings = {
 
 	browserToolEnabled: false,
 	browserViewportSize: "900x600",
-	screenshotQuality: 38,
-	remoteBrowserEnabled: true,
+	screenshotQuality: 75,
+	remoteBrowserEnabled: false,
 
 	enableCheckpoints: false,
 	checkpointStorage: "task",
diff --git a/evals/packages/types/src/roo-code.ts b/evals/packages/types/src/roo-code.ts
index 22bff70d16..32e7fd9750 100644
--- a/evals/packages/types/src/roo-code.ts
+++ b/evals/packages/types/src/roo-code.ts
@@ -96,7 +96,7 @@ export type TelemetrySetting = z.infer<typeof telemetrySettingsSchema>
  */
 
 export const modelInfoSchema = z.object({
-	maxTokens: z.number().optional(),
+	maxTokens: z.number().nullish(),
 	contextWindow: z.number(),
 	supportsImages: z.boolean().optional(),
 	supportsComputerUse: z.boolean().optional(),
@@ -373,11 +373,14 @@ export const providerSettingsSchema = z.object({
 	requestyApiKey: z.string().optional(),
 	requestyModelId: z.string().optional(),
 	requestyModelInfo: modelInfoSchema.optional(),
-	// Generic
+	// Claude 3.7 Sonnet Thinking
 	modelMaxTokens: z.number().optional(), // Currently only used by Anthropic hybrid thinking models.
 	modelMaxThinkingTokens: z.number().optional(), // Currently only used by Anthropic hybrid thinking models.
-	modelTemperature: z.number().nullish(),
+	// Generic
 	includeMaxTokens: z.boolean().optional(),
+	modelTemperature: z.number().nullish(),
+	reasoningEffort: z.enum(["low", "medium", "high"]).optional(),
+	rateLimitSeconds: z.number().optional(),
 	// Fake AI
 	fakeAi: z.unknown().optional(),
 })
@@ -457,11 +460,13 @@ const providerSettingsRecord: ProviderSettingsRecord = {
 	requestyModelId: undefined,
 	requestyModelInfo: undefined,
 	// Claude 3.7 Sonnet Thinking
-	modelTemperature: undefined,
 	modelMaxTokens: undefined,
 	modelMaxThinkingTokens: undefined,
 	// Generic
 	includeMaxTokens: undefined,
+	modelTemperature: undefined,
+	reasoningEffort: undefined,
+	rateLimitSeconds: undefined,
 	// Fake AI
 	fakeAi: undefined,
 }
diff --git a/src/api/providers/openai.ts b/src/api/providers/openai.ts
index fc739b3110..1e8e7ef30b 100644
--- a/src/api/providers/openai.ts
+++ b/src/api/providers/openai.ts
@@ -82,6 +82,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 		const urlHost = this._getUrlHost(modelUrl)
 		const deepseekReasoner = modelId.includes("deepseek-reasoner") || enabledR1Format
 		const ark = modelUrl.includes(".volces.com")
+
 		if (modelId.startsWith("o3-mini")) {
 			yield* this.handleO3FamilyMessage(modelId, systemPrompt, messages)
 			return
@@ -94,6 +95,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 			}
 
 			let convertedMessages
+
 			if (deepseekReasoner) {
 				convertedMessages = convertToR1Format([{ role: "user", content: systemPrompt }, ...messages])
 			} else if (ark || enabledLegacyFormat) {
@@ -112,16 +114,20 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 						],
 					}
 				}
+
 				convertedMessages = [systemMessage, ...convertToOpenAiMessages(messages)]
+
 				if (modelInfo.supportsPromptCache) {
 					// Note: the following logic is copied from openrouter:
 					// Add cache_control to the last two user messages
 					// (note: this works because we only ever add one user message at a time, but if we added multiple we'd need to mark the user message before the last assistant message)
 					const lastTwoUserMessages = convertedMessages.filter((msg) => msg.role === "user").slice(-2)
+
 					lastTwoUserMessages.forEach((msg) => {
 						if (typeof msg.content === "string") {
 							msg.content = [{ type: "text", text: msg.content }]
 						}
+
 						if (Array.isArray(msg.content)) {
 							// NOTE: this is fine since env details will always be added at the end. but if it weren't there, and the user added a image_url type message, it would pop a text part before it and then move it after to the end.
 							let lastTextPart = msg.content.filter((part) => part.type === "text").pop()
@@ -130,6 +136,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 								lastTextPart = { type: "text", text: "..." }
 								msg.content.push(lastTextPart)
 							}
+
 							// @ts-ignore-next-line
 							lastTextPart["cache_control"] = { type: "ephemeral" }
 						}
@@ -145,7 +152,9 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				messages: convertedMessages,
 				stream: true as const,
 				...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
+				reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
 			}
+
 			if (this.options.includeMaxTokens) {
 				requestOptions.max_tokens = modelInfo.maxTokens
 			}
@@ -185,6 +194,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 					lastUsage = chunk.usage
 				}
 			}
+
 			for (const chunk of matcher.final()) {
 				yield chunk
 			}
@@ -217,6 +227,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				type: "text",
 				text: response.choices[0]?.message.content || "",
 			}
+
 			yield this.processUsageMetrics(response.usage, modelInfo)
 		}
 	}
@@ -241,6 +252,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 	async completePrompt(prompt: string): Promise<string> {
 		try {
 			const isAzureAiInference = this._isAzureAiInference(this.options.openAiBaseUrl)
+
 			const requestOptions: OpenAI.Chat.Completions.ChatCompletionCreateParamsNonStreaming = {
 				model: this.getModel().id,
 				messages: [{ role: "user", content: prompt }],
@@ -250,11 +262,13 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				requestOptions,
 				isAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 			)
+
 			return response.choices[0]?.message.content || ""
 		} catch (error) {
 			if (error instanceof Error) {
 				throw new Error(`OpenAI completion error: ${error.message}`)
 			}
+
 			throw error
 		}
 	}
@@ -281,7 +295,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 					],
 					stream: true,
 					...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
-					reasoning_effort: this.getModel().info.reasoningEffort,
+					reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
 				},
 				methodIsAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 			)
@@ -333,6 +347,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 			}
 		}
 	}
+
 	private _getUrlHost(baseUrl?: string): string {
 		try {
 			return new URL(baseUrl ?? "").host

From 26bb8c9ecb4c8fae163eb732b301362c542ec188 Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Tue, 15 Apr 2025 11:47:30 -0700
Subject: [PATCH 6/8] Use translations

---
 webview-ui/src/components/settings/ReasoningEffort.tsx | 10 ++++------
 webview-ui/src/i18n/locales/en/settings.json           |  6 ++++++
 2 files changed, 10 insertions(+), 6 deletions(-)

diff --git a/webview-ui/src/components/settings/ReasoningEffort.tsx b/webview-ui/src/components/settings/ReasoningEffort.tsx
index 00ec57cc89..7c8ee3a385 100644
--- a/webview-ui/src/components/settings/ReasoningEffort.tsx
+++ b/webview-ui/src/components/settings/ReasoningEffort.tsx
@@ -3,7 +3,7 @@ import { useAppTranslation } from "@/i18n/TranslationContext"
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui"
 
 import { ApiConfiguration } from "../../../../src/shared/api"
-import { reasoningEfforts } from "../../../../src/schemas"
+import { reasoningEfforts, ReasoningEffort as ReasoningEffortType } from "../../../../src/schemas"
 
 interface ReasoningEffortProps {
 	apiConfiguration: ApiConfiguration
@@ -16,20 +16,18 @@ export const ReasoningEffort = ({ apiConfiguration, setApiConfigurationField }:
 	return (
 		<div className="flex flex-col gap-1">
 			<div className="flex justify-between items-center">
-				<label className="block font-medium mb-1">Model Reasoning Effort</label>
+				<label className="block font-medium mb-1">{t("settings:providers.reasoningEffort.label")}</label>
 			</div>
 			<Select
 				value={apiConfiguration.reasoningEffort}
-				onValueChange={(value) =>
-					setApiConfigurationField("reasoningEffort", value as "high" | "medium" | "low")
-				}>
+				onValueChange={(value) => setApiConfigurationField("reasoningEffort", value as ReasoningEffortType)}>
 				<SelectTrigger className="w-full">
 					<SelectValue placeholder={t("settings:common.select")} />
 				</SelectTrigger>
 				<SelectContent>
 					{reasoningEfforts.map((value) => (
 						<SelectItem key={value} value={value}>
-							{value}
+							{t(`settings:providers.reasoningEffort.${value}`)}
 						</SelectItem>
 					))}
 				</SelectContent>
diff --git a/webview-ui/src/i18n/locales/en/settings.json b/webview-ui/src/i18n/locales/en/settings.json
index b494ea01e5..e277085424 100644
--- a/webview-ui/src/i18n/locales/en/settings.json
+++ b/webview-ui/src/i18n/locales/en/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Rate limit",
 			"description": "Minimum time between API requests."
+		},
+		"reasoningEffort": {
+			"label": "Model Reasoning Effort",
+			"high": "High",
+			"medium": "Medium",
+			"low": "Low"
 		}
 	},
 	"browser": {

From 43117533c106732fdf79e130895a96f4168f24db Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Tue, 15 Apr 2025 11:52:46 -0700
Subject: [PATCH 7/8] Add translations

---
 webview-ui/src/i18n/locales/ca/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/de/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/es/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/fr/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/hi/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/it/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/ja/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/ko/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/pl/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/pt-BR/settings.json | 6 ++++++
 webview-ui/src/i18n/locales/tr/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/vi/settings.json    | 6 ++++++
 webview-ui/src/i18n/locales/zh-CN/settings.json | 6 ++++++
 webview-ui/src/i18n/locales/zh-TW/settings.json | 6 ++++++
 14 files changed, 84 insertions(+)

diff --git a/webview-ui/src/i18n/locales/ca/settings.json b/webview-ui/src/i18n/locales/ca/settings.json
index af009b4337..00fb251eab 100644
--- a/webview-ui/src/i18n/locales/ca/settings.json
+++ b/webview-ui/src/i18n/locales/ca/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Límit de freqüència",
 			"description": "Temps mínim entre sol·licituds d'API."
+		},
+		"reasoningEffort": {
+			"label": "Esforç de raonament del model",
+			"high": "Alt",
+			"medium": "Mitjà",
+			"low": "Baix"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/de/settings.json b/webview-ui/src/i18n/locales/de/settings.json
index 11ff0d5a06..59d986be18 100644
--- a/webview-ui/src/i18n/locales/de/settings.json
+++ b/webview-ui/src/i18n/locales/de/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Ratenbegrenzung",
 			"description": "Minimale Zeit zwischen API-Anfragen."
+		},
+		"reasoningEffort": {
+			"label": "Modell-Denkaufwand",
+			"high": "Hoch",
+			"medium": "Mittel",
+			"low": "Niedrig"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/es/settings.json b/webview-ui/src/i18n/locales/es/settings.json
index 0b1f40d5a2..af6e2b218e 100644
--- a/webview-ui/src/i18n/locales/es/settings.json
+++ b/webview-ui/src/i18n/locales/es/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Límite de tasa",
 			"description": "Tiempo mínimo entre solicitudes de API."
+		},
+		"reasoningEffort": {
+			"label": "Esfuerzo de razonamiento del modelo",
+			"high": "Alto",
+			"medium": "Medio",
+			"low": "Bajo"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/fr/settings.json b/webview-ui/src/i18n/locales/fr/settings.json
index d2499a90ad..948dfb127b 100644
--- a/webview-ui/src/i18n/locales/fr/settings.json
+++ b/webview-ui/src/i18n/locales/fr/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Limite de débit",
 			"description": "Temps minimum entre les requêtes API."
+		},
+		"reasoningEffort": {
+			"label": "Effort de raisonnement du modèle",
+			"high": "Élevé",
+			"medium": "Moyen",
+			"low": "Faible"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/hi/settings.json b/webview-ui/src/i18n/locales/hi/settings.json
index 8572ad1008..1aaf89e946 100644
--- a/webview-ui/src/i18n/locales/hi/settings.json
+++ b/webview-ui/src/i18n/locales/hi/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "दर सीमा",
 			"description": "API अनुरोधों के बीच न्यूनतम समय।"
+		},
+		"reasoningEffort": {
+			"label": "मॉडल तर्क प्रयास",
+			"high": "उच्च",
+			"medium": "मध्यम",
+			"low": "निम्न"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/it/settings.json b/webview-ui/src/i18n/locales/it/settings.json
index 50282e98f9..570bca7d2e 100644
--- a/webview-ui/src/i18n/locales/it/settings.json
+++ b/webview-ui/src/i18n/locales/it/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Limite di frequenza",
 			"description": "Tempo minimo tra le richieste API."
+		},
+		"reasoningEffort": {
+			"label": "Sforzo di ragionamento del modello",
+			"high": "Alto",
+			"medium": "Medio",
+			"low": "Basso"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/ja/settings.json b/webview-ui/src/i18n/locales/ja/settings.json
index e41d8e361c..101f56cd8a 100644
--- a/webview-ui/src/i18n/locales/ja/settings.json
+++ b/webview-ui/src/i18n/locales/ja/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "レート制限",
 			"description": "APIリクエスト間の最小時間。"
+		},
+		"reasoningEffort": {
+			"label": "モデル推論の労力",
+			"high": "高",
+			"medium": "中",
+			"low": "低"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/ko/settings.json b/webview-ui/src/i18n/locales/ko/settings.json
index 05e7aa2944..c13e7e8f73 100644
--- a/webview-ui/src/i18n/locales/ko/settings.json
+++ b/webview-ui/src/i18n/locales/ko/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "속도 제한",
 			"description": "API 요청 간 최소 시간."
+		},
+		"reasoningEffort": {
+			"label": "모델 추론 노력",
+			"high": "높음",
+			"medium": "중간",
+			"low": "낮음"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/pl/settings.json b/webview-ui/src/i18n/locales/pl/settings.json
index 2d27e9a85c..534ee15234 100644
--- a/webview-ui/src/i18n/locales/pl/settings.json
+++ b/webview-ui/src/i18n/locales/pl/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Limit szybkości",
 			"description": "Minimalny czas między żądaniami API."
+		},
+		"reasoningEffort": {
+			"label": "Wysiłek rozumowania modelu",
+			"high": "Wysoki",
+			"medium": "Średni",
+			"low": "Niski"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/pt-BR/settings.json b/webview-ui/src/i18n/locales/pt-BR/settings.json
index 9181d8fdb3..5df5798a6d 100644
--- a/webview-ui/src/i18n/locales/pt-BR/settings.json
+++ b/webview-ui/src/i18n/locales/pt-BR/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Limite de taxa",
 			"description": "Tempo mínimo entre requisições de API."
+		},
+		"reasoningEffort": {
+			"label": "Esforço de raciocínio do modelo",
+			"high": "Alto",
+			"medium": "Médio",
+			"low": "Baixo"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/tr/settings.json b/webview-ui/src/i18n/locales/tr/settings.json
index 5f26eea0b9..9723383005 100644
--- a/webview-ui/src/i18n/locales/tr/settings.json
+++ b/webview-ui/src/i18n/locales/tr/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Hız sınırı",
 			"description": "API istekleri arasındaki minimum süre."
+		},
+		"reasoningEffort": {
+			"label": "Model Akıl Yürütme Çabası",
+			"high": "Yüksek",
+			"medium": "Orta",
+			"low": "Düşük"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/vi/settings.json b/webview-ui/src/i18n/locales/vi/settings.json
index 824635fbf6..5ab7fe9b28 100644
--- a/webview-ui/src/i18n/locales/vi/settings.json
+++ b/webview-ui/src/i18n/locales/vi/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Giới hạn tốc độ",
 			"description": "Thời gian tối thiểu giữa các yêu cầu API."
+		},
+		"reasoningEffort": {
+			"label": "Nỗ lực suy luận của mô hình",
+			"high": "Cao",
+			"medium": "Trung bình",
+			"low": "Thấp"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/zh-CN/settings.json b/webview-ui/src/i18n/locales/zh-CN/settings.json
index 97067ffa62..da85a296bb 100644
--- a/webview-ui/src/i18n/locales/zh-CN/settings.json
+++ b/webview-ui/src/i18n/locales/zh-CN/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "请求频率限制",
 			"description": "设置API请求的最小间隔时间"
+		},
+		"reasoningEffort": {
+			"label": "模型推理强度",
+			"high": "高",
+			"medium": "中",
+			"low": "低"
 		}
 	},
 	"browser": {
diff --git a/webview-ui/src/i18n/locales/zh-TW/settings.json b/webview-ui/src/i18n/locales/zh-TW/settings.json
index cf99713793..f98c40e607 100644
--- a/webview-ui/src/i18n/locales/zh-TW/settings.json
+++ b/webview-ui/src/i18n/locales/zh-TW/settings.json
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "速率限制",
 			"description": "API 請求間的最短時間"
+		},
+		"reasoningEffort": {
+			"label": "模型推理強度",
+			"high": "高",
+			"medium": "中",
+			"low": "低"
 		}
 	},
 	"browser": {

From 6498c8704efa95102c92f1a881b0de4a7d184dd3 Mon Sep 17 00:00:00 2001
From: cte <cestreich@gmail.com>
Date: Tue, 15 Apr 2025 12:30:02 -0700
Subject: [PATCH 8/8] Remove hard-coded grok-3-mini-beta reasoning_effort check

---
 src/api/providers/openai.ts | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/api/providers/openai.ts b/src/api/providers/openai.ts
index 1e8e7ef30b..96984d90c1 100644
--- a/src/api/providers/openai.ts
+++ b/src/api/providers/openai.ts
@@ -152,7 +152,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				messages: convertedMessages,
 				stream: true as const,
 				...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
-				reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
+				reasoning_effort: this.getModel().info.reasoningEffort,
 			}
 
 			if (this.options.includeMaxTokens) {
@@ -295,7 +295,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 					],
 					stream: true,
 					...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
-					reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
+					reasoning_effort: this.getModel().info.reasoningEffort,
 				},
 				methodIsAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 			)