Skip to content

Commit 7d12794

Browse files
committed
feat: add OpenAI context window error handling
- Add comprehensive context window error detection for OpenAI, OpenRouter, Anthropic, and Cerebras
- Implement automatic retry with aggressive context truncation (25% reduction)
- Use proper profile settings for condensing operations
- Add robust error handling with try-catch blocks

Based on PR #5479 from the cline/cline repository
1 parent 5e07bc4 commit 7d12794

File tree

2 files changed

+133
-0
lines changed

2 files changed

+133
-0
lines changed
Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
1+
import { APIError } from "openai"
2+
3+
export function checkContextWindowExceededError(error: unknown): boolean {
4+
return (
5+
checkIsOpenAIContextWindowError(error) ||
6+
checkIsOpenRouterContextWindowError(error) ||
7+
checkIsAnthropicContextWindowError(error) ||
8+
checkIsCerebrasContextWindowError(error)
9+
)
10+
}
11+
12+
function checkIsOpenRouterContextWindowError(error: any): boolean {
13+
try {
14+
const status = error?.status ?? error?.code ?? error?.error?.status ?? error?.response?.status
15+
const message: string = String(error?.message || error?.error?.message || "")
16+
17+
// Known OpenAI/OpenRouter-style signal (code 400 and message includes "context length")
18+
const CONTEXT_ERROR_PATTERNS = [
19+
/\bcontext\s*(?:length|window)\b/i,
20+
/\bmaximum\s*context\b/i,
21+
/\b(?:input\s*)?tokens?\s*exceed/i,
22+
/\btoo\s*many\s*tokens?\b/i,
23+
] as const
24+
25+
return String(status) === "400" && CONTEXT_ERROR_PATTERNS.some((pattern) => pattern.test(message))
26+
} catch {
27+
return false
28+
}
29+
}
30+
31+
// Docs: https://platform.openai.com/docs/guides/error-codes/api-errors
32+
function checkIsOpenAIContextWindowError(error: unknown): boolean {
33+
try {
34+
// Check for LengthFinishReasonError
35+
if (error && typeof error === "object" && "name" in error && error.name === "LengthFinishReasonError") {
36+
return true
37+
}
38+
39+
const KNOWN_CONTEXT_ERROR_SUBSTRINGS = ["token", "context length"] as const
40+
41+
return (
42+
Boolean(error) &&
43+
error instanceof APIError &&
44+
error.code?.toString() === "400" &&
45+
KNOWN_CONTEXT_ERROR_SUBSTRINGS.some((substring) => error.message.includes(substring))
46+
)
47+
} catch {
48+
return false
49+
}
50+
}
51+
52+
function checkIsAnthropicContextWindowError(response: any): boolean {
53+
try {
54+
return response?.error?.error?.type === "invalid_request_error"
55+
} catch {
56+
return false
57+
}
58+
}
59+
60+
function checkIsCerebrasContextWindowError(response: any): boolean {
61+
try {
62+
const status = response?.status ?? response?.code ?? response?.error?.status ?? response?.response?.status
63+
const message: string = String(response?.message || response?.error?.message || "")
64+
65+
return String(status) === "400" && message.includes("Please reduce the length of the messages or completion")
66+
} catch {
67+
return false
68+
}
69+
}

src/core/task/Task.ts

Lines changed: 64 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -86,6 +86,7 @@ import { MultiSearchReplaceDiffStrategy } from "../diff/strategies/multi-search-
8686
import { MultiFileSearchReplaceDiffStrategy } from "../diff/strategies/multi-file-search-replace"
8787
import { readApiMessages, saveApiMessages, readTaskMessages, saveTaskMessages, taskMetadata } from "../task-persistence"
8888
import { getEnvironmentDetails } from "../environment/getEnvironmentDetails"
89+
import { checkContextWindowExceededError } from "../context/context-management/context-error-handling"
8990
import {
9091
type CheckpointDiffOptions,
9192
type CheckpointRestoreOptions,
@@ -2121,6 +2122,59 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
21212122
})()
21222123
}
21232124

2125+
	/**
	 * Recovers from a context-window-exceeded API error by forcing an
	 * aggressive condense/truncation of the conversation history, then
	 * (if a summary was produced) surfacing a "condense_context" message
	 * to the UI. Called from attemptApiRequest before retrying the request.
	 */
	private async handleContextWindowExceededError(): Promise<void> {
		const state = await this.providerRef.deref()?.getState()
		const { profileThresholds = {} } = state ?? {}

		const { contextTokens } = this.getTokenUsage()
		const modelInfo = this.api.getModel().info
		const maxTokens = getModelMaxOutputTokens({
			modelId: this.api.getModel().id,
			model: modelInfo,
			settings: this.apiConfiguration,
		})
		const contextWindow = modelInfo.contextWindow

		// Get the current profile ID the same way as in attemptApiRequest
		const currentProfileId =
			state?.listApiConfigMeta?.find((profile: any) => profile.name === state?.currentApiConfigName)?.id ??
			"default"

		// Force aggressive truncation by removing 25% of the conversation history.
		// autoCondenseContextPercent: 75 means "keep at most 75%", i.e. a forced
		// 25% reduction regardless of the user's configured threshold.
		const truncateResult = await truncateConversationIfNeeded({
			messages: this.apiConversationHistory,
			totalTokens: contextTokens || 0, // contextTokens may be undefined before the first usage report
			maxTokens,
			contextWindow,
			apiHandler: this.api,
			autoCondenseContext: true,
			autoCondenseContextPercent: 75, // Force 25% reduction
			systemPrompt: await this.getSystemPrompt(),
			taskId: this.taskId,
			profileThresholds,
			currentProfileId,
		})

		// NOTE(review): identity comparison — truncateConversationIfNeeded is
		// presumed to return the same array instance when nothing changed;
		// confirm against its implementation.
		if (truncateResult.messages !== this.apiConversationHistory) {
			await this.overwriteApiConversationHistory(truncateResult.messages)
		}

		// A summary is only present when condensing (vs. plain truncation)
		// occurred; report it to the UI as a non-interactive event.
		if (truncateResult.summary) {
			const { summary, cost, prevContextTokens, newContextTokens = 0 } = truncateResult
			const contextCondense: ContextCondense = { summary, cost, newContextTokens, prevContextTokens }
			await this.say(
				"condense_context",
				undefined /* text */,
				undefined /* images */,
				false /* partial */,
				undefined /* checkpoint */,
				undefined /* progressStatus */,
				{ isNonInteractive: true } /* options */,
				contextCondense,
			)
		}
	}
2177+
21242178
public async *attemptApiRequest(retryAttempt: number = 0): ApiStream {
21252179
const state = await this.providerRef.deref()?.getState()
21262180

@@ -2308,6 +2362,16 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
23082362
this.isWaitingForFirstChunk = false
23092363
} catch (error) {
23102364
this.isWaitingForFirstChunk = false
2365+
const isContextWindowExceededError = checkContextWindowExceededError(error)
2366+
2367+
// If it's a context window error and we haven't already retried for this reason
2368+
if (isContextWindowExceededError && retryAttempt === 0) {
2369+
await this.handleContextWindowExceededError()
2370+
// Retry the request after handling the context window error
2371+
yield* this.attemptApiRequest(retryAttempt + 1)
2372+
return
2373+
}
2374+
23112375
// note that this api_req_failed ask is unique in that we only present this option if the api hasn't streamed any content yet (ie it fails on the first chunk due), as it would allow them to hit a retry button. However if the api failed mid-stream, it could be in any arbitrary state where some tools may have executed, so that error is handled differently and requires cancelling the task entirely.
23122376
if (autoApprovalEnabled && alwaysApproveResubmit) {
23132377
let errorMsg

0 commit comments

Comments
 (0)