
Commit 726c3f2

More progress
1 parent eb9c740

10 files changed: +269 additions, −290 deletions

src/api/transform/model-params.ts

Lines changed: 3 additions & 2 deletions

@@ -1,4 +1,5 @@
-import type { ApiHandlerOptions, ModelInfo } from "../../shared/api"
+import type { ModelInfo, ProviderSettings } from "../../shared/api"
+
 import { ANTHROPIC_DEFAULT_MAX_TOKENS } from "../providers/constants"

 export type ModelParams = {
@@ -19,7 +20,7 @@ export function getModelParams({
 	defaultMaxTokens,
 	defaultTemperature = 0,
 }: {
-	options: ApiHandlerOptions
+	options: ProviderSettings
 	model: ModelInfo
 	defaultMaxTokens?: number
 	defaultTemperature?: number
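
Since getModelParams now accepts ProviderSettings directly instead of the ApiHandlerOptions alias, provider handlers can pass their settings object straight through. A minimal sketch of a caller, assuming illustrative field values (nothing below beyond the signature shown above comes from this commit):

import type { ModelInfo, ProviderSettings } from "../../shared/api"
import { getModelParams } from "./model-params"

// Illustrative inputs; any valid ProviderSettings/ModelInfo pair works.
const settings: ProviderSettings = { modelMaxTokens: 4096 }

const model: ModelInfo = {
	contextWindow: 200_000,
	supportsPromptCache: true,
	maxTokens: 8192,
}

// No conversion step: the handler's settings are the options.
const params = getModelParams({ options: settings, model, defaultTemperature: 0 })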

src/api/transform/reasoning.ts

Lines changed: 5 additions & 11 deletions

@@ -2,6 +2,7 @@ import { BetaThinkingConfigParam } from "@anthropic-ai/sdk/resources/beta"
 import OpenAI from "openai"

 import { ModelInfo, ProviderSettings } from "../../schemas"
+import { shouldUseReasoningBudget, shouldUseReasoningEffort } from "../../shared/api"

 import type { ModelParams } from "./model-params"

@@ -21,21 +22,14 @@ export type GetModelResoningOptions = {
 	settings: ProviderSettings
 }

-const shouldUseReasoningBudget = (model: ModelInfo, settings: ProviderSettings, params: ModelParams) =>
-	(model.requiredReasoningBudget || (model.supportsReasoningBudget && settings.enableReasoningEffort)) &&
-	params.reasoningBudget
-
-const shouldUseReasoningEffort = (model: ModelInfo, params: ModelParams) =>
-	model.supportsReasoningEffort && params.reasoningEffort
-
 export const getOpenRouterReasoning = ({
 	model,
 	params,
 	settings,
 }: GetModelResoningOptions): OpenRouterReasoningParams | undefined =>
-	shouldUseReasoningBudget(model, settings, params)
+	shouldUseReasoningBudget({ model, settings })
 		? { max_tokens: params.reasoningBudget }
-		: shouldUseReasoningEffort(model, params)
+		: shouldUseReasoningEffort({ model, settings })
 			? { effort: params.reasoningEffort }
 			: undefined

@@ -44,7 +38,7 @@ export const getAnthropicReasoning = ({
 	params,
 	settings,
 }: GetModelResoningOptions): AnthropicReasoningParams | undefined =>
-	shouldUseReasoningBudget(model, settings, params)
+	shouldUseReasoningBudget({ model, settings })
 		? { type: "enabled", budget_tokens: params.reasoningBudget! }
 		: undefined

@@ -53,4 +47,4 @@ export const getOpenAiReasoning = ({
 	params,
 	settings,
 }: GetModelResoningOptions): OpenAiReasoningParams | undefined =>
-	shouldUseReasoningEffort(model, params) ? { reasoning_effort: params.reasoningEffort } : undefined
+	shouldUseReasoningEffort({ model, settings }) ? { reasoning_effort: params.reasoningEffort } : undefined
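
With the predicates moved to src/shared/api.ts, all three helpers now make the same { model, settings } decision and only read params for the budget or effort value itself. A rough usage sketch; the inputs are assumptions for illustration, not from this commit:

import type { ModelParams } from "./model-params"
import { getOpenRouterReasoning, getAnthropicReasoning } from "./reasoning"

// A hybrid-reasoning model with the user opt-in enabled (illustrative values).
const model = { contextWindow: 200_000, supportsPromptCache: true, supportsReasoningBudget: true }
const settings = { enableReasoningEffort: true }

// Other ModelParams fields are omitted for brevity; the shape is assumed.
const params = { reasoningBudget: 8_192 } as ModelParams

getOpenRouterReasoning({ model, params, settings }) // => { max_tokens: 8192 }
getAnthropicReasoning({ model, params, settings }) // => { type: "enabled", budget_tokens: 8192 }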

src/shared/__tests__/api.test.ts

Lines changed: 154 additions & 0 deletions

@@ -0,0 +1,154 @@
+// npx jest src/shared/__tests__/api.test.ts
+
+import { type ModelInfo, ProviderSettings, getModelMaxOutputTokens } from "../api"
+
describe("getMaxTokensForModel", () => {
6+
/**
7+
* Testing the specific fix in commit cc79178f:
8+
* For thinking models, use apiConfig.modelMaxTokens if available,
9+
* otherwise fall back to 8192 (not modelInfo.maxTokens)
10+
*/
11+
12+
it("should return apiConfig.modelMaxTokens for thinking models when provided", () => {
13+
const model: ModelInfo = {
14+
contextWindow: 200_000,
15+
supportsPromptCache: true,
16+
requiredReasoningBudget: true,
17+
maxTokens: 8000,
18+
}
19+
20+
const settings: ProviderSettings = {
21+
modelMaxTokens: 4000,
22+
}
23+
24+
expect(getModelMaxOutputTokens({ model, settings })).toBe(4000)
25+
})
26+
27+
it("should return 16_384 for thinking models when modelMaxTokens not provided", () => {
28+
const model: ModelInfo = {
29+
contextWindow: 200_000,
30+
supportsPromptCache: true,
31+
requiredReasoningBudget: true,
32+
maxTokens: 8000,
33+
}
34+
35+
const settings = {}
36+
37+
expect(getModelMaxOutputTokens({ model, settings })).toBe(16_384)
38+
})
39+
40+
it("should return 16_384 for thinking models when apiConfig is undefined", () => {
41+
const model: ModelInfo = {
42+
contextWindow: 200_000,
43+
supportsPromptCache: true,
44+
requiredReasoningBudget: true,
45+
maxTokens: 8000,
46+
}
47+
48+
expect(getModelMaxOutputTokens({ model, settings: undefined })).toBe(16_384)
49+
})
50+
51+
it("should return modelInfo.maxTokens for non-thinking models", () => {
52+
const model: ModelInfo = {
53+
contextWindow: 200_000,
54+
supportsPromptCache: true,
55+
maxTokens: 8000,
56+
}
57+
58+
const settings: ProviderSettings = {
59+
modelMaxTokens: 4000,
60+
}
61+
62+
expect(getModelMaxOutputTokens({ model, settings })).toBe(8000)
63+
})
64+
65+
it("should return undefined for non-thinking models with undefined maxTokens", () => {
66+
const model: ModelInfo = {
67+
contextWindow: 200_000,
68+
supportsPromptCache: true,
69+
}
70+
71+
const settings: ProviderSettings = {
72+
modelMaxTokens: 4000,
73+
}
74+
75+
expect(getModelMaxOutputTokens({ model, settings })).toBeUndefined()
76+
})
77+
78+
test("should return maxTokens from modelInfo when thinking is false", () => {
79+
const model: ModelInfo = {
80+
contextWindow: 200_000,
81+
supportsPromptCache: true,
82+
maxTokens: 2048,
83+
}
84+
85+
const settings: ProviderSettings = {
86+
modelMaxTokens: 4096,
87+
}
88+
89+
const result = getModelMaxOutputTokens({ model, settings })
90+
expect(result).toBe(2048)
91+
})
92+
93+
test("should return modelMaxTokens from apiConfig when thinking is true", () => {
94+
const model: ModelInfo = {
95+
contextWindow: 200_000,
96+
supportsPromptCache: true,
97+
maxTokens: 2048,
98+
requiredReasoningBudget: true,
99+
}
100+
101+
const settings: ProviderSettings = {
102+
modelMaxTokens: 4096,
103+
}
104+
105+
const result = getModelMaxOutputTokens({ model, settings })
106+
expect(result).toBe(4096)
107+
})
108+
109+
test("should fallback to DEFAULT_THINKING_MODEL_MAX_TOKENS when thinking is true but apiConfig.modelMaxTokens is not defined", () => {
110+
const model: ModelInfo = {
111+
contextWindow: 200_000,
112+
supportsPromptCache: true,
113+
maxTokens: 2048,
114+
requiredReasoningBudget: true,
115+
}
116+
117+
const settings: ProviderSettings = {}
118+
119+
const result = getModelMaxOutputTokens({ model, settings: undefined })
120+
expect(result).toBe(16_384)
121+
})
122+
123+
test("should handle undefined inputs gracefully", () => {
124+
const modelInfoOnly: ModelInfo = {
125+
contextWindow: 200_000,
126+
supportsPromptCache: true,
127+
maxTokens: 2048,
128+
}
129+
130+
expect(getModelMaxOutputTokens({ model: modelInfoOnly, settings: undefined })).toBe(2048)
131+
})
132+
133+
test("should handle missing properties gracefully", () => {
134+
const modelInfoWithoutMaxTokens: ModelInfo = {
135+
contextWindow: 200_000,
136+
supportsPromptCache: true,
137+
requiredReasoningBudget: true,
138+
}
139+
140+
const settings: ProviderSettings = {
141+
modelMaxTokens: 4096,
142+
}
143+
144+
expect(getModelMaxOutputTokens({ model: modelInfoWithoutMaxTokens, settings })).toBe(4096)
145+
146+
const modelInfoWithoutThinking: ModelInfo = {
147+
contextWindow: 200_000,
148+
supportsPromptCache: true,
149+
maxTokens: 2048,
150+
}
151+
152+
expect(getModelMaxOutputTokens({ model: modelInfoWithoutThinking, settings: undefined })).toBe(2048)
153+
})
154+
})

src/shared/api.ts

Lines changed: 48 additions & 1 deletion

@@ -2,7 +2,7 @@ import { ModelInfo, ProviderName, ProviderSettings } from "../schemas"

 export type { ModelInfo, ProviderName, ProviderSettings }

-export type ApiHandlerOptions = Omit<ProviderSettings, "apiProvider" | "id">
+export type ApiHandlerOptions = Omit<ProviderSettings, "apiProvider">

 // Anthropic
 // https://docs.anthropic.com/en/docs/about-claude/models
@@ -1921,3 +1921,50 @@ export function toRouterName(value?: string): RouterName {
 export type ModelRecord = Record<string, ModelInfo>

 export type RouterModels = Record<RouterName, ModelRecord>
+
+export const shouldUseReasoningBudget = ({
+	model,
+	settings,
+}: {
+	model: ModelInfo
+	settings?: ProviderSettings
+}): boolean => !!model.requiredReasoningBudget || (!!model.supportsReasoningBudget && !!settings?.enableReasoningEffort)
+
+export const shouldUseReasoningEffort = ({
+	model,
+	settings,
+}: {
+	model: ModelInfo
+	settings?: ProviderSettings
+}): boolean => !!model.supportsReasoningEffort && (!!model.reasoningEffort || !!settings?.reasoningEffort)
+
+export const DEFAULT_HYBRID_REASONING_MODEL_MAX_TOKENS = 16_384
+export const DEFAULT_HYBRID_REASONING_MODEL_THINKING_TOKENS = 8_192
+
+export const getModelMaxOutputTokens = ({
+	model,
+	settings,
+}: {
+	model: ModelInfo
+	settings?: ProviderSettings
+}): number | undefined => {
+	if (shouldUseReasoningBudget({ model, settings })) {
+		return settings?.modelMaxTokens || DEFAULT_HYBRID_REASONING_MODEL_MAX_TOKENS
+	}
+
+	return model.maxTokens ?? undefined
+}
+
+export const getModelMaxThinkingTokens = ({
+	model,
+	settings,
+}: {
+	model: ModelInfo
+	settings?: ProviderSettings
+}): number | undefined => {
+	if (shouldUseReasoningBudget({ model, settings })) {
+		return settings?.modelMaxThinkingTokens || DEFAULT_HYBRID_REASONING_MODEL_THINKING_TOKENS
+	}
+
+	return undefined
+}
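
A minimal sketch of the two new helpers in use, with the defaults taken from the constants above (the model object itself is illustrative):

import { getModelMaxOutputTokens, getModelMaxThinkingTokens } from "../shared/api"
import type { ModelInfo, ProviderSettings } from "../shared/api"

// A model that always requires a reasoning budget (illustrative values).
const model: ModelInfo = {
	contextWindow: 200_000,
	supportsPromptCache: true,
	requiredReasoningBudget: true,
	maxTokens: 8_000,
}

// Without user overrides, the hybrid-reasoning defaults apply.
getModelMaxOutputTokens({ model, settings: undefined }) // => 16_384
getModelMaxThinkingTokens({ model, settings: undefined }) // => 8_192

// Explicit settings win over both the defaults and model.maxTokens.
const settings: ProviderSettings = { modelMaxTokens: 4_096, modelMaxThinkingTokens: 2_048 }
getModelMaxOutputTokens({ model, settings }) // => 4_096
getModelMaxThinkingTokens({ model, settings }) // => 2_048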
Lines changed: 1 addition & 13 deletions

@@ -1,15 +1,3 @@
-import React from "react"
-// Import the actual utility instead of reimplementing it
-import { getMaxTokensForModel } from "@/utils/model-utils"
-
-// Re-export the utility function to maintain the same interface
-export { getMaxTokensForModel }
-
-/**
- * Mock version of the TaskHeader component
- */
-const TaskHeader: React.FC<any> = () => {
-	return <div data-testid="mocked-task-header">Mocked TaskHeader</div>
-}
+const TaskHeader = () => <div data-testid="mocked-task-header">Mocked TaskHeader</div>

 export default TaskHeader

webview-ui/src/__tests__/getMaxTokensForModel.test.tsx

Lines changed: 0 additions & 81 deletions
This file was deleted.
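
Read alongside the new src/shared/__tests__/api.test.ts above, this deletion suggests the webview-local getMaxTokensForModel utility was superseded by the shared getModelMaxOutputTokens helper, which is also why the TaskHeader mock no longer needs to re-export it.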
