Commit e7a57ea

Expose reasoning effort option for reasoning models on OpenRouter (#2483)
* Specify reasoning effort for OpenRouter reasoning models
* Add ReasoningEffort type
* Fix ReasoningEffort props
* Remove copypasta
* Set reasoning effort for Grok 3 Mini
* Use translations
* Add translations
* Remove this check
1 parent 51bcade commit e7a57ea

21 files changed: +172 −5 lines changed

src/api/index.ts

Lines changed: 5 additions & 1 deletion
@@ -88,21 +88,25 @@ export function getModelParams({
 	model,
 	defaultMaxTokens,
 	defaultTemperature = 0,
+	defaultReasoningEffort,
 }: {
 	options: ApiHandlerOptions
 	model: ModelInfo
 	defaultMaxTokens?: number
 	defaultTemperature?: number
+	defaultReasoningEffort?: "low" | "medium" | "high"
 }) {
 	const {
 		modelMaxTokens: customMaxTokens,
 		modelMaxThinkingTokens: customMaxThinkingTokens,
 		modelTemperature: customTemperature,
+		reasoningEffort: customReasoningEffort,
 	} = options

 	let maxTokens = model.maxTokens ?? defaultMaxTokens
 	let thinking: BetaThinkingConfigParam | undefined = undefined
 	let temperature = customTemperature ?? defaultTemperature
+	const reasoningEffort = customReasoningEffort ?? defaultReasoningEffort

 	if (model.thinking) {
 		// Only honor `customMaxTokens` for thinking models.
@@ -118,5 +122,5 @@ export function getModelParams({
 		temperature = 1.0
 	}

-	return { maxTokens, thinking, temperature }
+	return { maxTokens, thinking, temperature, reasoningEffort }
 }
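
The net effect is a simple precedence chain: a user-configured `reasoningEffort` in the handler options overrides the provider's `defaultReasoningEffort`, and both stay undefined when neither is set. A minimal sketch of that resolution (the option values here are hypothetical, and `apiHandlerOptions`/`modelInfo` are assumed to be otherwise-complete objects):

// Sketch: the user setting wins; the per-model default is the fallback.
const { reasoningEffort } = getModelParams({
	options: { ...apiHandlerOptions, reasoningEffort: "high" }, // user setting
	model: modelInfo,
	defaultReasoningEffort: "low", // per-model default passed by the provider
})
// reasoningEffort === "high"; with no user setting it falls back to "low",
// and with neither set it remains undefined.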

src/api/providers/openai.ts

Lines changed: 15 additions & 0 deletions
@@ -82,6 +82,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandler {
 		const urlHost = this._getUrlHost(modelUrl)
 		const deepseekReasoner = modelId.includes("deepseek-reasoner") || enabledR1Format
 		const ark = modelUrl.includes(".volces.com")
+
 		if (modelId.startsWith("o3-mini")) {
 			yield* this.handleO3FamilyMessage(modelId, systemPrompt, messages)
 			return
@@ -94,6 +95,7 @@
 		}

 		let convertedMessages
+
 		if (deepseekReasoner) {
 			convertedMessages = convertToR1Format([{ role: "user", content: systemPrompt }, ...messages])
 		} else if (ark || enabledLegacyFormat) {
@@ -112,16 +114,20 @@
 					],
 				}
 			}
+
 			convertedMessages = [systemMessage, ...convertToOpenAiMessages(messages)]
+
 			if (modelInfo.supportsPromptCache) {
 				// Note: the following logic is copied from openrouter:
 				// Add cache_control to the last two user messages
 				// (note: this works because we only ever add one user message at a time, but if we added multiple we'd need to mark the user message before the last assistant message)
 				const lastTwoUserMessages = convertedMessages.filter((msg) => msg.role === "user").slice(-2)
+
 				lastTwoUserMessages.forEach((msg) => {
 					if (typeof msg.content === "string") {
 						msg.content = [{ type: "text", text: msg.content }]
 					}
+
 					if (Array.isArray(msg.content)) {
 						// NOTE: this is fine since env details will always be added at the end. but if it weren't there, and the user added a image_url type message, it would pop a text part before it and then move it after to the end.
 						let lastTextPart = msg.content.filter((part) => part.type === "text").pop()
@@ -130,6 +136,7 @@
 							lastTextPart = { type: "text", text: "..." }
 							msg.content.push(lastTextPart)
 						}
+
 						// @ts-ignore-next-line
 						lastTextPart["cache_control"] = { type: "ephemeral" }
 					}
@@ -145,7 +152,9 @@
 			messages: convertedMessages,
 			stream: true as const,
 			...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
+			reasoning_effort: this.getModel().info.reasoningEffort,
 		}
+
 		if (this.options.includeMaxTokens) {
 			requestOptions.max_tokens = modelInfo.maxTokens
 		}
@@ -185,6 +194,7 @@
 				lastUsage = chunk.usage
 			}
 		}
+
 		for (const chunk of matcher.final()) {
 			yield chunk
 		}
@@ -217,6 +227,7 @@
 				type: "text",
 				text: response.choices[0]?.message.content || "",
 			}
+
 			yield this.processUsageMetrics(response.usage, modelInfo)
 		}
 	}
@@ -241,6 +252,7 @@
 	async completePrompt(prompt: string): Promise<string> {
 		try {
 			const isAzureAiInference = this._isAzureAiInference(this.options.openAiBaseUrl)
+
 			const requestOptions: OpenAI.Chat.Completions.ChatCompletionCreateParamsNonStreaming = {
 				model: this.getModel().id,
 				messages: [{ role: "user", content: prompt }],
@@ -250,11 +262,13 @@
 				requestOptions,
 				isAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 			)
+
 			return response.choices[0]?.message.content || ""
 		} catch (error) {
 			if (error instanceof Error) {
 				throw new Error(`OpenAI completion error: ${error.message}`)
 			}
+
 			throw error
 		}
 	}
@@ -333,6 +347,7 @@
 			}
 		}
 	}
+
 	private _getUrlHost(baseUrl?: string): string {
 		try {
 			return new URL(baseUrl ?? "").host
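
One behavioral note on the new `reasoning_effort` line: it is assigned unconditionally, so for models without a configured effort the field is `undefined` and simply serializes away (JSON.stringify drops undefined properties), leaving the request unchanged. A sketch of the resulting streaming params — the model id and message are illustrative, and the assumption is an openai-node version whose chat-completions params already include `reasoning_effort`:

import OpenAI from "openai"

// Illustrative shape of the streaming request after this change.
// reasoning_effort mirrors ModelInfo.reasoningEffort and is dropped
// from the wire body when undefined.
const requestOptions: OpenAI.Chat.Completions.ChatCompletionCreateParamsStreaming = {
	model: "o3-mini", // hypothetical model id
	messages: [{ role: "user", content: "Summarize this diff." }],
	stream: true,
	stream_options: { include_usage: true },
	reasoning_effort: "medium",
}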

src/api/providers/openrouter.ts

Lines changed: 12 additions & 3 deletions
@@ -1,8 +1,7 @@
 import { Anthropic } from "@anthropic-ai/sdk"
 import { BetaThinkingConfigParam } from "@anthropic-ai/sdk/resources/beta"
-import axios, { AxiosRequestConfig } from "axios"
+import axios from "axios"
 import OpenAI from "openai"
-import delay from "delay"

 import { ApiHandlerOptions, ModelInfo, openRouterDefaultModelId, openRouterDefaultModelInfo } from "../../shared/api"
 import { parseApiPrice } from "../../utils/cost"
@@ -22,6 +21,12 @@ type OpenRouterChatCompletionParams = OpenAI.Chat.ChatCompletionCreateParams & {
 	transforms?: string[]
 	include_reasoning?: boolean
 	thinking?: BetaThinkingConfigParam
+	// https://openrouter.ai/docs/use-cases/reasoning-tokens
+	reasoning?: {
+		effort?: "high" | "medium" | "low"
+		max_tokens?: number
+		exclude?: boolean
+	}
 }

 export class OpenRouterHandler extends BaseProvider implements SingleCompletionHandler {
@@ -42,7 +47,7 @@
 		systemPrompt: string,
 		messages: Anthropic.Messages.MessageParam[],
 	): AsyncGenerator<ApiStreamChunk> {
-		let { id: modelId, maxTokens, thinking, temperature, topP } = this.getModel()
+		let { id: modelId, maxTokens, thinking, temperature, topP, reasoningEffort } = this.getModel()

 		// Convert Anthropic messages to OpenAI format.
 		let openAiMessages: OpenAI.Chat.ChatCompletionMessageParam[] = [
@@ -70,13 +75,16 @@
 				},
 			],
 		}
+
 		// Add cache_control to the last two user messages
 		// (note: this works because we only ever add one user message at a time, but if we added multiple we'd need to mark the user message before the last assistant message)
 		const lastTwoUserMessages = openAiMessages.filter((msg) => msg.role === "user").slice(-2)
+
 		lastTwoUserMessages.forEach((msg) => {
 			if (typeof msg.content === "string") {
 				msg.content = [{ type: "text", text: msg.content }]
 			}
+
 			if (Array.isArray(msg.content)) {
 				// NOTE: this is fine since env details will always be added at the end. but if it weren't there, and the user added a image_url type message, it would pop a text part before it and then move it after to the end.
 				let lastTextPart = msg.content.filter((part) => part.type === "text").pop()
@@ -113,6 +121,7 @@
 			}),
 			// This way, the transforms field will only be included in the parameters when openRouterUseMiddleOutTransform is true.
 			...((this.options.openRouterUseMiddleOutTransform ?? true) && { transforms: ["middle-out"] }),
+			...(reasoningEffort && { reasoning: { effort: reasoningEffort } }),
 		}

 		const stream = await this.client.chat.completions.create(completionParams)
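
Because the `reasoning` field is added with a conditional spread, it only reaches the wire when an effort is actually configured; otherwise the request body is identical to what it was before this change. A sketch of the resulting params for a Grok 3 Mini request, per the OpenRouter reasoning-tokens docs linked in the hunk (message content is illustrative):

// Sketch of completionParams with an effort set. With reasoningEffort
// undefined, the conditional spread omits `reasoning` entirely.
const completionParams: OpenRouterChatCompletionParams = {
	model: "x-ai/grok-3-mini-beta",
	messages: [{ role: "user", content: "Hello" }],
	stream: true,
	transforms: ["middle-out"],
	reasoning: { effort: "high" },
}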

webview-ui/src/components/settings/ApiOptions.tsx

Lines changed: 11 additions & 1 deletion
@@ -46,7 +46,7 @@ import {
 	OPENROUTER_DEFAULT_PROVIDER_NAME,
 } from "@/components/ui/hooks/useOpenRouterModelProviders"
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue, SelectSeparator, Button } from "@/components/ui"
-import { MODELS_BY_PROVIDER, PROVIDERS, VERTEX_REGIONS } from "./constants"
+import { MODELS_BY_PROVIDER, PROVIDERS, VERTEX_REGIONS, REASONING_MODELS } from "./constants"
 import { AWS_REGIONS } from "../../../../src/shared/aws_regions"
 import { VSCodeButtonLink } from "../common/VSCodeButtonLink"
 import { ModelInfoView } from "./ModelInfoView"
@@ -59,6 +59,7 @@ import { ThinkingBudget } from "./ThinkingBudget"
 import { R1FormatSetting } from "./R1FormatSetting"
 import { OpenRouterBalanceDisplay } from "./OpenRouterBalanceDisplay"
 import { RequestyBalanceDisplay } from "./RequestyBalanceDisplay"
+import { ReasoningEffort } from "./ReasoningEffort"

 interface ApiOptionsProps {
 	uriScheme: string | undefined
@@ -1538,6 +1539,13 @@ const ApiOptions = ({
 				</div>
 			)}

+			{selectedProvider === "openrouter" && REASONING_MODELS.has(selectedModelId) && (
+				<ReasoningEffort
+					apiConfiguration={apiConfiguration}
+					setApiConfigurationField={setApiConfigurationField}
+				/>
+			)}
+
 			{selectedProvider === "glama" && (
 				<ModelPicker
 					apiConfiguration={apiConfiguration}
@@ -1665,12 +1673,14 @@ const ApiOptions = ({
 				})()}
 			</>
 		)}
+
 		<ModelInfoView
 			selectedModelId={selectedModelId}
 			modelInfo={selectedModelInfo}
 			isDescriptionExpanded={isDescriptionExpanded}
 			setIsDescriptionExpanded={setIsDescriptionExpanded}
 		/>
+
 		<ThinkingBudget
 			key={`${selectedProvider}-${selectedModelId}`}
 			apiConfiguration={apiConfiguration}
webview-ui/src/components/settings/ReasoningEffort.tsx

Lines changed: 37 additions & 0 deletions

@@ -0,0 +1,37 @@
+import { useAppTranslation } from "@/i18n/TranslationContext"
+
+import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from "@/components/ui"
+
+import { ApiConfiguration } from "../../../../src/shared/api"
+import { reasoningEfforts, ReasoningEffort as ReasoningEffortType } from "../../../../src/schemas"
+
+interface ReasoningEffortProps {
+	apiConfiguration: ApiConfiguration
+	setApiConfigurationField: <K extends keyof ApiConfiguration>(field: K, value: ApiConfiguration[K]) => void
+}
+
+export const ReasoningEffort = ({ apiConfiguration, setApiConfigurationField }: ReasoningEffortProps) => {
+	const { t } = useAppTranslation()
+
+	return (
+		<div className="flex flex-col gap-1">
+			<div className="flex justify-between items-center">
+				<label className="block font-medium mb-1">{t("settings:providers.reasoningEffort.label")}</label>
+			</div>
+			<Select
+				value={apiConfiguration.reasoningEffort}
+				onValueChange={(value) => setApiConfigurationField("reasoningEffort", value as ReasoningEffortType)}>
+				<SelectTrigger className="w-full">
+					<SelectValue placeholder={t("settings:common.select")} />
+				</SelectTrigger>
+				<SelectContent>
+					{reasoningEfforts.map((value) => (
+						<SelectItem key={value} value={value}>
+							{t(`settings:providers.reasoningEffort.${value}`)}
+						</SelectItem>
+					))}
+				</SelectContent>
+			</Select>
+		</div>
+	)
+}
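
The `reasoningEfforts.map(...)` loop and the `as ReasoningEffortType` cast imply that `src/schemas` exports both a value list and a type. That file isn't part of this diff, but a shape like the following sketch — an assumption, shown with zod since the commit notes "Add ReasoningEffort type" — would satisfy the component:

import { z } from "zod"

// Assumed shape of the src/schemas export (not shown in this commit):
// a value tuple, a schema over it, and the inferred union type.
export const reasoningEfforts = ["low", "medium", "high"] as const
export const reasoningEffortsSchema = z.enum(reasoningEfforts)
export type ReasoningEffort = z.infer<typeof reasoningEffortsSchema>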

webview-ui/src/components/settings/constants.ts

Lines changed: 2 additions & 0 deletions
@@ -46,3 +46,5 @@ export const VERTEX_REGIONS = [
 	{ value: "europe-west4", label: "europe-west4" },
 	{ value: "asia-southeast1", label: "asia-southeast1" },
 ]
+
+export const REASONING_MODELS = new Set(["x-ai/grok-3-mini-beta"])
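
For reference, this set is consumed in ApiOptions.tsx as a plain membership check, so the effort dropdown is scoped to OpenRouter models known to accept a reasoning effort — currently just Grok 3 Mini:

// From the ApiOptions.tsx hunk above: the dropdown renders only for
// OpenRouter models present in REASONING_MODELS.
const showReasoningEffort = selectedProvider === "openrouter" && REASONING_MODELS.has(selectedModelId)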

webview-ui/src/i18n/locales/ca/settings.json

Lines changed: 6 additions & 0 deletions
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Límit de freqüència",
 			"description": "Temps mínim entre sol·licituds d'API."
+		},
+		"reasoningEffort": {
+			"label": "Esforç de raonament del model",
+			"high": "Alt",
+			"medium": "Mitjà",
+			"low": "Baix"
 		}
 	},
 	"browser": {

webview-ui/src/i18n/locales/de/settings.json

Lines changed: 6 additions & 0 deletions
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Ratenbegrenzung",
 			"description": "Minimale Zeit zwischen API-Anfragen."
+		},
+		"reasoningEffort": {
+			"label": "Modell-Denkaufwand",
+			"high": "Hoch",
+			"medium": "Mittel",
+			"low": "Niedrig"
 		}
 	},
 	"browser": {

webview-ui/src/i18n/locales/en/settings.json

Lines changed: 6 additions & 0 deletions
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Rate limit",
 			"description": "Minimum time between API requests."
+		},
+		"reasoningEffort": {
+			"label": "Model Reasoning Effort",
+			"high": "High",
+			"medium": "Medium",
+			"low": "Low"
 		}
 	},
 	"browser": {

webview-ui/src/i18n/locales/es/settings.json

Lines changed: 6 additions & 0 deletions
@@ -225,6 +225,12 @@
 		"rateLimitSeconds": {
 			"label": "Límite de tasa",
 			"description": "Tiempo mínimo entre solicitudes de API."
+		},
+		"reasoningEffort": {
+			"label": "Esfuerzo de razonamiento del modelo",
+			"high": "Alto",
+			"medium": "Medio",
+			"low": "Bajo"
 		}
 	},
 	"browser": {
