fix(openai-native): background resume/poll logging + terminal handling for 401/403; types: GPT-5 Pro metadata — no prompt cache, no reasoningEffort flag; tests: remove duplicate GPT-5 Pro background test

hannesrudolph · hannesrudolph · commit 51d391d215db · 2025-10-16T19:47:58.000-06:00
diff --git a/packages/types/src/providers/openai.ts b/packages/types/src/providers/openai.ts
@@ -41,9 +41,10 @@ export const openAiNativeModels = {
 		maxTokens: 128000,
 		contextWindow: 400000,
 		supportsImages: true,
-		supportsPromptCache: true,
+		// GPT-5 Pro does NOT support prompt caching
+		supportsPromptCache: false,
+		// Reasoning effort is not user-configurable for this model: keep the capability flag off and define no default effort
 		supportsReasoningEffort: false,
-		reasoningEffort: "high",
 		inputPrice: 15.0,
 		outputPrice: 120.0,
 		description:
diff --git a/src/api/providers/__tests__/openai-native.spec.ts b/src/api/providers/__tests__/openai-native.spec.ts
@@ -1842,26 +1842,6 @@ describe("OpenAI Native background mode behavior", () => {
 		expect(requestBodyWithOptionFalse.stream).toBe(true)
 	})
 
-	it("auto-enables background mode for gpt-5-pro when no override is specified", async () => {
-		const handler = new OpenAiNativeHandler({
-			apiModelId: "gpt-5-pro-2025-10-06",
-			openAiNativeApiKey: "test",
-			// no openAiNativeBackgroundMode provided
-		})
-
-		mockResponsesCreate.mockResolvedValueOnce(createMinimalIterable())
-
-		const chunks: any[] = []
-		for await (const chunk of handler.createMessage(systemPrompt, baseMessages, metadataStoreFalse)) {
-			chunks.push(chunk)
-		}
-
-		expect(chunks).not.toHaveLength(0)
-		const requestBody = mockResponsesCreate.mock.calls[0][0]
-		expect(requestBody.background).toBe(true)
-		expect(requestBody.stream).toBe(true)
-		expect(requestBody.store).toBe(true)
-	})
 	it("forces store:true and includes background:true when falling back to SSE", async () => {
 		const handler = new OpenAiNativeHandler({
 			apiModelId: "gpt-5-pro-2025-10-06",
diff --git a/src/api/providers/openai-native.ts b/src/api/providers/openai-native.ts
@@ -1323,7 +1323,28 @@ export class OpenAiNativeHandler extends BaseProvider implements SingleCompletio
 				})
 
 				if (!res.ok) {
-					throw new Error(`Resume request failed (${res.status})`)
+					// Attach status and classify permanent failures
+					const err: any = new Error(`Resume request failed (${res.status})`)
+					err.status = res.status
+
+					// 401/403 are permanent for the current request - emit failed and stop
+					if (res.status === 401 || res.status === 403) {
+						yield {
+							type: "status",
+							mode: "background",
+							status: "failed",
+							responseId,
+						}
+						throw createTerminalBackgroundError(`Resume unauthorized/forbidden (${res.status})`)
+					}
+
+					// Other statuses (e.g., 404/429/5xx) are treated as transient; log and retry with backoff
+					console.warn?.("[openai-native] resume attempt failed", {
+						attempt,
+						status: res.status,
+						responseId,
+					})
+					throw err
 				}
 				if (!res.body) {
 					throw new Error("Resume request failed (no body)")
@@ -1358,10 +1379,24 @@ export class OpenAiNativeHandler extends BaseProvider implements SingleCompletio
 			} catch (err) {
 				// If terminal error, don't keep retrying resume; fall back to polling immediately
 				const delay = resumeBaseDelayMs * Math.pow(2, attempt)
+
 				if (isTerminalBackgroundError(err)) {
+					console.warn?.("[openai-native] resume terminated", {
+						attempt,
+						responseId,
+						error: (err as any)?.message,
+					})
 					break
 				}
-				// Otherwise retry with backoff
+
+				// Otherwise retry with backoff and lightweight logging for diagnostics
+				console.warn?.("[openai-native] resume retry", {
+					attempt,
+					responseId,
+					error: (err as any)?.message,
+					nextDelayMs: delay,
+				})
+
 				if (delay > 0) {
 					await new Promise((r) => setTimeout(r, delay))
 				}
@@ -1392,7 +1427,23 @@ export class OpenAiNativeHandler extends BaseProvider implements SingleCompletio
 				})
 
 				if (!pollRes.ok) {
-					// transient; wait and retry
+					// Treat auth/permission as permanent; others as transient with logging
+					if (pollRes.status === 401 || pollRes.status === 403) {
+						yield {
+							type: "status",
+							mode: "background",
+							status: "failed",
+							responseId,
+						}
+						throw createTerminalBackgroundError(
+							`Polling unauthorized/forbidden (${pollRes.status}) for ${responseId}`,
+						)
+					}
+
+					console.warn?.("[openai-native] polling non-OK response", {
+						status: pollRes.status,
+						responseId,
+					})
 					await new Promise((r) => setTimeout(r, pollIntervalMs))
 					continue
 				}