Skip to content

Commit 1c1a42c

Browse files
committed
feat: Add Advanced Setting for Custom Max Tokens per Provider Profile (#5784)
1 parent 6745c8f commit 1c1a42c

File tree

23 files changed

+437
-1
lines changed

23 files changed

+437
-1
lines changed

src/shared/__tests__/api.spec.ts

Lines changed: 64 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -154,6 +154,70 @@ describe("getModelMaxOutputTokens", () => {
154154

155155
expect(getModelMaxOutputTokens({ modelId: "test", model, settings })).toBe(16_384)
156156
})
157+
158+
test("should use user-configured modelMaxTokens for non-reasoning models", () => {
159+
const settings: ProviderSettings = {
160+
modelMaxTokens: 16000,
161+
}
162+
163+
const result = getModelMaxOutputTokens({
164+
modelId: "gpt-4",
165+
model: mockModel,
166+
settings,
167+
})
168+
169+
expect(result).toBe(16000)
170+
})
171+
172+
test("should ignore modelMaxTokens when it's 0 or negative", () => {
173+
const settings: ProviderSettings = {
174+
modelMaxTokens: 0,
175+
}
176+
177+
const result = getModelMaxOutputTokens({
178+
modelId: "claude-3-5-sonnet",
179+
model: mockModel,
180+
settings,
181+
})
182+
183+
// Should fall back to model's maxTokens
184+
expect(result).toBe(8192)
185+
})
186+
187+
test("should prioritize user-configured modelMaxTokens over model's default", () => {
188+
const modelWithHighMaxTokens: ModelInfo = {
189+
maxTokens: 64000,
190+
contextWindow: 200000,
191+
supportsPromptCache: true,
192+
}
193+
194+
const settings: ProviderSettings = {
195+
modelMaxTokens: 32000,
196+
}
197+
198+
const result = getModelMaxOutputTokens({
199+
modelId: "some-model",
200+
model: modelWithHighMaxTokens,
201+
settings,
202+
})
203+
204+
expect(result).toBe(32000)
205+
})
206+
207+
test("should use modelMaxTokens even for Anthropic models when configured", () => {
208+
const settings: ProviderSettings = {
209+
modelMaxTokens: 20000,
210+
}
211+
212+
const result = getModelMaxOutputTokens({
213+
modelId: "claude-3-5-sonnet",
214+
model: mockModel,
215+
settings,
216+
format: "anthropic",
217+
})
218+
219+
expect(result).toBe(20000)
220+
})
157221
})
158222

159223
describe("shouldUseReasoningBudget", () => {

src/shared/api.ts

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,8 +70,14 @@ export const getModelMaxOutputTokens = ({
7070
return settings.claudeCodeMaxOutputTokens || CLAUDE_CODE_DEFAULT_MAX_OUTPUT_TOKENS
7171
}
7272

73+
// Check for user-configured modelMaxTokens FIRST (new logic)
74+
if (settings?.modelMaxTokens && settings.modelMaxTokens > 0) {
75+
return settings.modelMaxTokens
76+
}
77+
78+
// Existing reasoning budget logic
7379
if (shouldUseReasoningBudget({ model, settings })) {
74-
return settings?.modelMaxTokens || DEFAULT_HYBRID_REASONING_MODEL_MAX_TOKENS
80+
return DEFAULT_HYBRID_REASONING_MODEL_MAX_TOKENS
7581
}
7682

7783
const isAnthropicContext =

webview-ui/src/components/settings/ApiOptions.tsx

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -81,6 +81,7 @@ import { DiffSettingsControl } from "./DiffSettingsControl"
8181
import { TemperatureControl } from "./TemperatureControl"
8282
import { RateLimitSecondsControl } from "./RateLimitSecondsControl"
8383
import { ConsecutiveMistakeLimitControl } from "./ConsecutiveMistakeLimitControl"
84+
import { MaxTokensControl } from "./MaxTokensControl"
8485
import { BedrockCustomArn } from "./providers/BedrockCustomArn"
8586
import { buildDocLink } from "@src/utils/docLinks"
8687

@@ -574,6 +575,13 @@ const ApiOptions = ({
574575
onChange={handleInputChange("modelTemperature", noTransform)}
575576
maxValue={2}
576577
/>
578+
<MaxTokensControl
579+
value={apiConfiguration.modelMaxTokens}
580+
onChange={(value) => setApiConfigurationField("modelMaxTokens", value)}
581+
modelInfo={selectedModelInfo}
582+
minValue={1000}
583+
maxValue={selectedModelInfo?.maxTokens || 200000}
584+
/>
577585
<RateLimitSecondsControl
578586
value={apiConfiguration.rateLimitSeconds || 0}
579587
onChange={(value) => setApiConfigurationField("rateLimitSeconds", value)}
Lines changed: 79 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,79 @@
import React from "react"
import { useAppTranslation } from "@/i18n/TranslationContext"
import { ModelInfo } from "@roo-code/types"
import { Input } from "@/components/ui"

interface MaxTokensControlProps {
	/** Current user-configured max output tokens; undefined means "not set". */
	value?: number
	/** Called with the parsed number, or undefined when the field is cleared. */
	onChange: (value: number | undefined) => void
	/** Info for the currently selected model; its maxTokens caps the input when known. */
	modelInfo?: ModelInfo
	/** Lower bound for validation (default 1000). */
	minValue?: number
	/** Fallback upper bound used when the model does not declare maxTokens (default 200000). */
	maxValue?: number
	className?: string
}

/**
 * Numeric input for the per-profile "Max Output Tokens" advanced setting.
 * Shows inline validation when the value is below minValue or above the
 * model's declared maximum, and a hint with the model's supported maximum
 * when the value is valid.
 */
export const MaxTokensControl: React.FC<MaxTokensControlProps> = ({
	value,
	onChange,
	modelInfo,
	minValue = 1000,
	maxValue = 200000,
	className,
}) => {
	const { t } = useAppTranslation()

	const handleChange = (e: React.ChangeEvent<HTMLInputElement>) => {
		const inputValue = e.target.value

		// An empty field means "unset" — revert to default behavior.
		if (inputValue === "") {
			onChange(undefined)
			return
		}

		// Ignore unparseable input rather than propagating NaN.
		const numValue = parseInt(inputValue, 10)
		if (!isNaN(numValue)) {
			onChange(numValue)
		}
	}

	// Prefer the model's own limit when it declares one; otherwise use the prop.
	const effectiveMaxValue = modelInfo?.maxTokens || maxValue
	// 8192 mirrors the default documented in the setting's description.
	const displayValue = value ?? 8192

	const isValueTooHigh = displayValue > effectiveMaxValue
	const isValueTooLow = displayValue < minValue
	const hasError = isValueTooHigh || isValueTooLow

	return (
		<div className={`flex flex-col gap-1 ${className || ""}`}>
			<label htmlFor="max-output-tokens" className="block font-medium mb-1">
				{t("settings:providers.maxOutputTokens.label")}
			</label>
			<Input
				id="max-output-tokens"
				type="number"
				value={displayValue}
				onChange={handleChange}
				min={minValue}
				max={effectiveMaxValue}
				className={`w-full ${hasError ? "border-red-500 focus:border-red-500" : ""}`}
			/>
			<div className="text-sm text-vscode-descriptionForeground">
				{t("settings:providers.maxOutputTokens.description")}
			</div>
			{isValueTooHigh && (
				<div className="text-sm text-red-500">
					{t("settings:providers.maxOutputTokens.validation.tooHigh", { max: effectiveMaxValue })}
				</div>
			)}
			{isValueTooLow && (
				<div className="text-sm text-red-500">
					{t("settings:providers.maxOutputTokens.validation.tooLow", { min: minValue })}
				</div>
			)}
			{/* Only show the "model supports up to N" hint when the model actually
			    declares a maximum — previously an absent maxTokens rendered as
			    "up to undefined tokens". */}
			{modelInfo?.maxTokens != null && !hasError && (
				<div className="text-sm text-vscode-descriptionForeground">
					{t("settings:providers.maxOutputTokens.modelSupports", { max: modelInfo.maxTokens })}
				</div>
			)}
		</div>
	)
}
Lines changed: 117 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,117 @@
// NOTE(review): `beforeEach` was used without being imported; unless vitest's
// `globals` option is enabled that is a ReferenceError. Importing it explicitly
// is correct in both configurations.
import { describe, test, expect, vi, beforeEach } from "vitest"
import { render, screen, fireEvent } from "@testing-library/react"
import { MaxTokensControl } from "../MaxTokensControl"
import { ModelInfo } from "@roo-code/types"

// Mock the translation hook: returns the raw key, with {{param}} interpolation
// applied when params are supplied, so assertions can target stable keys.
vi.mock("@/i18n/TranslationContext", () => ({
	useAppTranslation: () => ({
		t: (key: string, params?: any) => {
			if (params) {
				return key.replace(/\{\{(\w+)\}\}/g, (_, p) => params[p])
			}
			return key
		},
	}),
}))

describe("MaxTokensControl", () => {
	const mockOnChange = vi.fn()
	const defaultProps = {
		onChange: mockOnChange,
	}

	beforeEach(() => {
		mockOnChange.mockClear()
	})

	test("should render with default value of 8192", () => {
		render(<MaxTokensControl {...defaultProps} />)

		const input = screen.getByRole("spinbutton") as HTMLInputElement
		expect(input.value).toBe("8192")
	})

	test("should render with provided value", () => {
		render(<MaxTokensControl {...defaultProps} value={16000} />)

		const input = screen.getByRole("spinbutton") as HTMLInputElement
		expect(input.value).toBe("16000")
	})

	test("should call onChange when value changes", () => {
		render(<MaxTokensControl {...defaultProps} />)

		const input = screen.getByRole("spinbutton")
		fireEvent.change(input, { target: { value: "20000" } })

		expect(mockOnChange).toHaveBeenCalledWith(20000)
	})

	test("should call onChange with undefined when input is cleared", () => {
		render(<MaxTokensControl {...defaultProps} value={16000} />)

		const input = screen.getByRole("spinbutton")
		fireEvent.change(input, { target: { value: "" } })

		expect(mockOnChange).toHaveBeenCalledWith(undefined)
	})

	test("should show validation error when value exceeds model max", () => {
		const modelInfo: ModelInfo = {
			maxTokens: 10000,
			contextWindow: 100000,
			supportsPromptCache: true,
		}

		render(<MaxTokensControl {...defaultProps} value={15000} modelInfo={modelInfo} />)

		expect(screen.getByText("settings:providers.maxOutputTokens.validation.tooHigh")).toBeInTheDocument()
	})

	test("should show validation error when value is below minimum", () => {
		render(<MaxTokensControl {...defaultProps} value={500} minValue={1000} />)

		expect(screen.getByText("settings:providers.maxOutputTokens.validation.tooLow")).toBeInTheDocument()
	})

	test("should show model support message when valid", () => {
		const modelInfo: ModelInfo = {
			maxTokens: 64000,
			contextWindow: 200000,
			supportsPromptCache: true,
		}

		render(<MaxTokensControl {...defaultProps} value={8192} modelInfo={modelInfo} />)

		expect(screen.getByText("settings:providers.maxOutputTokens.modelSupports")).toBeInTheDocument()
	})

	test("should use custom min and max values", () => {
		render(<MaxTokensControl {...defaultProps} minValue={2000} maxValue={50000} />)

		const input = screen.getByRole("spinbutton") as HTMLInputElement
		expect(input.min).toBe("2000")
		expect(input.max).toBe("50000")
	})

	test("should use model's maxTokens as max value when available", () => {
		const modelInfo: ModelInfo = {
			maxTokens: 32000,
			contextWindow: 100000,
			supportsPromptCache: true,
		}

		render(<MaxTokensControl {...defaultProps} modelInfo={modelInfo} />)

		const input = screen.getByRole("spinbutton") as HTMLInputElement
		expect(input.max).toBe("32000")
	})

	test("should apply error styling when validation fails", () => {
		render(<MaxTokensControl {...defaultProps} value={500} minValue={1000} />)

		const input = screen.getByRole("spinbutton")
		expect(input.className).toContain("border-red-500")
	})
})

webview-ui/src/i18n/locales/ca/settings.json

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -386,6 +386,15 @@
386386
"placeholder": "Per defecte: claude",
387387
"maxTokensLabel": "Tokens màxims de sortida",
388388
"maxTokensDescription": "Nombre màxim de tokens de sortida per a les respostes de Claude Code. El valor per defecte és 8000."
389+
},
390+
"maxOutputTokens": {
391+
"label": "Tokens màxims de sortida",
392+
"description": "Nombre màxim de tokens a reservar per a la sortida del model. El valor predeterminat és 8192.",
393+
"validation": {
394+
"tooHigh": "El valor excedeix el màxim del model de {{max}} tokens",
395+
"tooLow": "El valor ha de ser almenys {{min}} tokens"
396+
},
397+
"modelSupports": "Aquest model admet fins a {{max}} tokens"
389398
}
390399
},
391400
"browser": {

webview-ui/src/i18n/locales/de/settings.json

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -386,6 +386,15 @@
386386
"placeholder": "Standard: claude",
387387
"maxTokensLabel": "Maximale Ausgabe-Tokens",
388388
"maxTokensDescription": "Maximale Anzahl an Ausgabe-Tokens für Claude Code-Antworten. Standard ist 8000."
389+
},
390+
"maxOutputTokens": {
391+
"label": "Maximale Ausgabe-Token",
392+
"description": "Maximale Anzahl von Token, die für die Modellausgabe reserviert werden sollen. Standard ist 8192.",
393+
"validation": {
394+
"tooHigh": "Wert überschreitet das Maximum des Modells von {{max}} Token",
395+
"tooLow": "Wert muss mindestens {{min}} Token betragen"
396+
},
397+
"modelSupports": "Dieses Modell unterstützt bis zu {{max}} Token"
389398
}
390399
},
391400
"browser": {

webview-ui/src/i18n/locales/en/settings.json

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -367,6 +367,15 @@
367367
"label": "Rate limit",
368368
"description": "Minimum time between API requests."
369369
},
370+
"maxOutputTokens": {
371+
"label": "Max Output Tokens",
372+
"description": "Maximum number of tokens to reserve for model output. Default is 8192.",
373+
"validation": {
374+
"tooHigh": "Value exceeds model's maximum of {{max}} tokens",
375+
"tooLow": "Value must be at least {{min}} tokens"
376+
},
377+
"modelSupports": "This model supports up to {{max}} tokens"
378+
},
370379
"consecutiveMistakeLimit": {
371380
"label": "Error & Repetition Limit",
372381
"description": "Number of consecutive errors or repeated actions before showing 'Roo is having trouble' dialog",

webview-ui/src/i18n/locales/es/settings.json

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -367,6 +367,15 @@
367367
"label": "Límite de tasa",
368368
"description": "Tiempo mínimo entre solicitudes de API."
369369
},
370+
"maxOutputTokens": {
371+
"label": "Tokens máximos de salida",
372+
"description": "Número máximo de tokens a reservar para la salida del modelo. El valor predeterminado es 8192.",
373+
"validation": {
374+
"tooHigh": "El valor excede el máximo del modelo de {{max}} tokens",
375+
"tooLow": "El valor debe ser al menos {{min}} tokens"
376+
},
377+
"modelSupports": "Este modelo admite hasta {{max}} tokens"
378+
},
370379
"consecutiveMistakeLimit": {
371380
"label": "Límite de errores y repeticiones",
372381
"description": "Número de errores consecutivos o acciones repetidas antes de mostrar el diálogo 'Roo está teniendo problemas'",

webview-ui/src/i18n/locales/fr/settings.json

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -386,6 +386,15 @@
386386
"placeholder": "Défaut : claude",
387387
"maxTokensLabel": "Jetons de sortie max",
388388
"maxTokensDescription": "Nombre maximum de jetons de sortie pour les réponses de Claude Code. La valeur par défaut est 8000."
389+
},
390+
"maxOutputTokens": {
391+
"label": "Tokens de sortie maximum",
392+
"description": "Nombre maximum de tokens à réserver pour la sortie du modèle. La valeur par défaut est 8192.",
393+
"validation": {
394+
"tooHigh": "La valeur dépasse le maximum du modèle de {{max}} tokens",
395+
"tooLow": "La valeur doit être d'au moins {{min}} tokens"
396+
},
397+
"modelSupports": "Ce modèle prend en charge jusqu'à {{max}} tokens"
389398
}
390399
},
391400
"browser": {

0 commit comments

Comments
 (0)