
Commit c091ba1

Set reasoning effort for Grok 3 Mini
1 parent 6a69d48 commit c091ba1

3 files changed: +33 additions, -10 deletions

evals/packages/types/src/roo-code-defaults.ts
evals/packages/types/src/roo-code.ts
src/api/providers/openai.ts

evals/packages/types/src/roo-code-defaults.ts

Lines changed: 8 additions & 5 deletions
@@ -20,18 +20,21 @@ export const rooCodeDefaults: RooCodeSettings = {
 	// thinking: false,
 	// },
 
+	modelTemperature: null,
+	// reasoningEffort: "high",
+
 	pinnedApiConfigs: {},
-	lastShownAnnouncementId: "mar-20-2025-3-10",
+	lastShownAnnouncementId: "apr-04-2025-boomerang",
 
 	autoApprovalEnabled: true,
 	alwaysAllowReadOnly: true,
 	alwaysAllowReadOnlyOutsideWorkspace: false,
 	alwaysAllowWrite: true,
 	alwaysAllowWriteOutsideWorkspace: false,
-	writeDelayMs: 200,
+	writeDelayMs: 1000,
 	alwaysAllowBrowser: true,
 	alwaysApproveResubmit: true,
-	requestDelaySeconds: 5,
+	requestDelaySeconds: 10,
 	alwaysAllowMcp: true,
 	alwaysAllowModeSwitch: true,
 	alwaysAllowSubtasks: true,
@@ -40,8 +43,8 @@ export const rooCodeDefaults: RooCodeSettings = {
 
 	browserToolEnabled: false,
 	browserViewportSize: "900x600",
-	screenshotQuality: 38,
-	remoteBrowserEnabled: true,
+	screenshotQuality: 75,
+	remoteBrowserEnabled: false,
 
 	enableCheckpoints: false,
 	checkpointStorage: "task",
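As a usage sketch only (not part of the commit): the defaults above are intended to be spread into a run's settings and selectively overridden. The import paths and the grokRunSettings name below are assumptions, and reasoningEffort is shown set explicitly the way a run opting into high effort might do, since the default above leaves it commented out.

import type { RooCodeSettings } from "./roo-code"
import { rooCodeDefaults } from "./roo-code-defaults"

// Hypothetical per-run override: spread the shared defaults, then set only the knobs this run cares about.
const grokRunSettings: RooCodeSettings = {
	...rooCodeDefaults,
	reasoningEffort: "high",
	requestDelaySeconds: 10,
}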

evals/packages/types/src/roo-code.ts

Lines changed: 9 additions & 4 deletions
@@ -96,7 +96,7 @@ export type TelemetrySetting = z.infer<typeof telemetrySettingsSchema>
  */
 
 export const modelInfoSchema = z.object({
-	maxTokens: z.number().optional(),
+	maxTokens: z.number().nullish(),
 	contextWindow: z.number(),
 	supportsImages: z.boolean().optional(),
 	supportsComputerUse: z.boolean().optional(),
@@ -373,11 +373,14 @@ export const providerSettingsSchema = z.object({
 	requestyApiKey: z.string().optional(),
 	requestyModelId: z.string().optional(),
 	requestyModelInfo: modelInfoSchema.optional(),
-	// Generic
+	// Claude 3.7 Sonnet Thinking
 	modelMaxTokens: z.number().optional(), // Currently only used by Anthropic hybrid thinking models.
 	modelMaxThinkingTokens: z.number().optional(), // Currently only used by Anthropic hybrid thinking models.
-	modelTemperature: z.number().nullish(),
+	// Generic
 	includeMaxTokens: z.boolean().optional(),
+	modelTemperature: z.number().nullish(),
+	reasoningEffort: z.enum(["low", "medium", "high"]).optional(),
+	rateLimitSeconds: z.number().optional(),
 	// Fake AI
 	fakeAi: z.unknown().optional(),
 })
@@ -457,11 +460,13 @@ const providerSettingsRecord: ProviderSettingsRecord = {
 	requestyModelId: undefined,
 	requestyModelInfo: undefined,
 	// Claude 3.7 Sonnet Thinking
-	modelTemperature: undefined,
 	modelMaxTokens: undefined,
 	modelMaxThinkingTokens: undefined,
 	// Generic
 	includeMaxTokens: undefined,
+	modelTemperature: undefined,
+	reasoningEffort: undefined,
+	rateLimitSeconds: undefined,
 	// Fake AI
 	fakeAi: undefined,
 }
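A standalone sketch of the zod behavior these schema changes rely on, reduced to the two fields the commit touches (the sketchSchema name is illustrative, not the real providerSettingsSchema): .nullish() accepts null as well as undefined, while the new reasoningEffort enum accepts only the three listed strings or omission.

import { z } from "zod"

// Reduced illustration only; the real providerSettingsSchema has many more fields.
const sketchSchema = z.object({
	maxTokens: z.number().nullish(), // number, null, or undefined are all valid
	reasoningEffort: z.enum(["low", "medium", "high"]).optional(), // one of the three strings, or undefined
})

sketchSchema.parse({ maxTokens: null }) // ok: .nullish() allows null; .optional() alone would reject it
sketchSchema.parse({ reasoningEffort: "high" }) // ok
sketchSchema.parse({}) // ok: both fields may be omitted
// sketchSchema.parse({ reasoningEffort: "max" }) // would throw: "max" is not in the enum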

src/api/providers/openai.ts

Lines changed: 16 additions & 1 deletion
@@ -82,6 +82,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 		const urlHost = this._getUrlHost(modelUrl)
 		const deepseekReasoner = modelId.includes("deepseek-reasoner") || enabledR1Format
 		const ark = modelUrl.includes(".volces.com")
+
 		if (modelId.startsWith("o3-mini")) {
 			yield* this.handleO3FamilyMessage(modelId, systemPrompt, messages)
 			return
@@ -94,6 +95,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 		}
 
 		let convertedMessages
+
 		if (deepseekReasoner) {
 			convertedMessages = convertToR1Format([{ role: "user", content: systemPrompt }, ...messages])
 		} else if (ark || enabledLegacyFormat) {
@@ -112,16 +114,20 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				],
 			}
 		}
+
 		convertedMessages = [systemMessage, ...convertToOpenAiMessages(messages)]
+
 		if (modelInfo.supportsPromptCache) {
 			// Note: the following logic is copied from openrouter:
 			// Add cache_control to the last two user messages
 			// (note: this works because we only ever add one user message at a time, but if we added multiple we'd need to mark the user message before the last assistant message)
 			const lastTwoUserMessages = convertedMessages.filter((msg) => msg.role === "user").slice(-2)
+
 			lastTwoUserMessages.forEach((msg) => {
 				if (typeof msg.content === "string") {
 					msg.content = [{ type: "text", text: msg.content }]
 				}
+
 				if (Array.isArray(msg.content)) {
 					// NOTE: this is fine since env details will always be added at the end. but if it weren't there, and the user added a image_url type message, it would pop a text part before it and then move it after to the end.
 					let lastTextPart = msg.content.filter((part) => part.type === "text").pop()
@@ -130,6 +136,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 						lastTextPart = { type: "text", text: "..." }
 						msg.content.push(lastTextPart)
 					}
+
 					// @ts-ignore-next-line
 					lastTextPart["cache_control"] = { type: "ephemeral" }
 				}
@@ -145,7 +152,9 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 			messages: convertedMessages,
 			stream: true as const,
 			...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
+			reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
 		}
+
 		if (this.options.includeMaxTokens) {
 			requestOptions.max_tokens = modelInfo.maxTokens
 		}
@@ -185,6 +194,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				lastUsage = chunk.usage
 			}
 		}
+
 		for (const chunk of matcher.final()) {
 			yield chunk
 		}
@@ -217,6 +227,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				type: "text",
 				text: response.choices[0]?.message.content || "",
 			}
+
 			yield this.processUsageMetrics(response.usage, modelInfo)
 		}
 	}
@@ -241,6 +252,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 	async completePrompt(prompt: string): Promise<string> {
 		try {
 			const isAzureAiInference = this._isAzureAiInference(this.options.openAiBaseUrl)
+
 			const requestOptions: OpenAI.Chat.Completions.ChatCompletionCreateParamsNonStreaming = {
 				model: this.getModel().id,
 				messages: [{ role: "user", content: prompt }],
@@ -250,11 +262,13 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				requestOptions,
 				isAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 			)
+
 			return response.choices[0]?.message.content || ""
 		} catch (error) {
 			if (error instanceof Error) {
 				throw new Error(`OpenAI completion error: ${error.message}`)
 			}
+
 			throw error
 		}
 	}
@@ -281,7 +295,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 				],
 				stream: true,
 				...(isGrokXAI ? {} : { stream_options: { include_usage: true } }),
-				reasoning_effort: this.getModel().info.reasoningEffort,
+				reasoning_effort: modelId === "grok-3-mini-beta" ? "high" : this.getModel().info.reasoningEffort,
 			},
 			methodIsAzureAiInference ? { path: AZURE_AI_INFERENCE_PATH } : {},
 		)
@@ -333,6 +347,7 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 			}
 		}
 	}
+
 	private _getUrlHost(baseUrl?: string): string {
 		try {
 			return new URL(baseUrl ?? "").host
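The effect of the two reasoning_effort changes, as a self-contained sketch (the helper and type names below are illustrative, not the handler's real identifiers): grok-3-mini-beta is always sent "high", and every other model falls back to whatever its model info declares, which may be undefined, in which case the field is simply left out of the serialized request.

// Illustrative helper, not the actual OpenAiHandler code.
type ReasoningEffort = "low" | "medium" | "high"

interface ModelInfoSketch {
	reasoningEffort?: ReasoningEffort
}

function selectReasoningEffort(modelId: string, info: ModelInfoSketch): ReasoningEffort | undefined {
	// Grok 3 Mini is pinned to "high"; other models use their configured effort, if any.
	return modelId === "grok-3-mini-beta" ? "high" : info.reasoningEffort
}

console.log(selectReasoningEffort("grok-3-mini-beta", {})) // "high"
console.log(selectReasoningEffort("o3-mini", { reasoningEffort: "medium" })) // "medium"
console.log(selectReasoningEffort("gpt-4o", {})) // undefined, so reasoning_effort is omitted from the request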
