fix: update OpenAI provider to use tiers array format for service tier pricing

daniel-lxs · daniel-lxs · commit d9ec2484642e · 2025-09-04T12:46:22.000-05:00
diff --git a/packages/types/src/providers/openai.ts b/packages/types/src/providers/openai.ts
@@ -32,11 +32,10 @@ export const openAiNativeModels = {
 		// supportsVerbosity is a new capability; ensure ModelInfo includes it
 		supportsVerbosity: true,
 		supportsTemperature: false,
-		allowedServiceTiers: ["flex", "priority"],
-		serviceTierPricing: {
-			flex: { inputPrice: 0.625, outputPrice: 5.0, cacheReadsPrice: 0.0625 },
-			priority: { inputPrice: 2.5, outputPrice: 20.0, cacheReadsPrice: 0.25 },
-		},
+		tiers: [
+			{ name: "flex", contextWindow: 400000, inputPrice: 0.625, outputPrice: 5.0, cacheReadsPrice: 0.0625 },
+			{ name: "priority", contextWindow: 400000, inputPrice: 2.5, outputPrice: 20.0, cacheReadsPrice: 0.25 },
+		],
 	},
 	"gpt-5-mini-2025-08-07": {
 		maxTokens: 128000,
@@ -51,11 +50,10 @@ export const openAiNativeModels = {
 		description: "GPT-5 Mini: A faster, more cost-efficient version of GPT-5 for well-defined tasks",
 		supportsVerbosity: true,
 		supportsTemperature: false,
-		allowedServiceTiers: ["flex", "priority"],
-		serviceTierPricing: {
-			flex: { inputPrice: 0.125, outputPrice: 1.0, cacheReadsPrice: 0.0125 },
-			priority: { inputPrice: 0.45, outputPrice: 3.6, cacheReadsPrice: 0.045 },
-		},
+		tiers: [
+			{ name: "flex", contextWindow: 400000, inputPrice: 0.125, outputPrice: 1.0, cacheReadsPrice: 0.0125 },
+			{ name: "priority", contextWindow: 400000, inputPrice: 0.45, outputPrice: 3.6, cacheReadsPrice: 0.045 },
+		],
 	},
 	"gpt-5-nano-2025-08-07": {
 		maxTokens: 128000,
@@ -70,10 +68,7 @@ export const openAiNativeModels = {
 		description: "GPT-5 Nano: Fastest, most cost-efficient version of GPT-5",
 		supportsVerbosity: true,
 		supportsTemperature: false,
-		allowedServiceTiers: ["flex"],
-		serviceTierPricing: {
-			flex: { inputPrice: 0.025, outputPrice: 0.2, cacheReadsPrice: 0.0025 },
-		},
+		tiers: [{ name: "flex", contextWindow: 400000, inputPrice: 0.025, outputPrice: 0.2, cacheReadsPrice: 0.0025 }],
 	},
 	"gpt-4.1": {
 		maxTokens: 32_768,
@@ -84,10 +79,9 @@ export const openAiNativeModels = {
 		outputPrice: 8,
 		cacheReadsPrice: 0.5,
 		supportsTemperature: true,
-		allowedServiceTiers: ["priority"],
-		serviceTierPricing: {
-			priority: { inputPrice: 3.5, outputPrice: 14.0, cacheReadsPrice: 0.875 },
-		},
+		tiers: [
+			{ name: "priority", contextWindow: 1_047_576, inputPrice: 3.5, outputPrice: 14.0, cacheReadsPrice: 0.875 },
+		],
 	},
 	"gpt-4.1-mini": {
 		maxTokens: 32_768,
@@ -98,10 +92,9 @@ export const openAiNativeModels = {
 		outputPrice: 1.6,
 		cacheReadsPrice: 0.1,
 		supportsTemperature: true,
-		allowedServiceTiers: ["priority"],
-		serviceTierPricing: {
-			priority: { inputPrice: 0.7, outputPrice: 2.8, cacheReadsPrice: 0.175 },
-		},
+		tiers: [
+			{ name: "priority", contextWindow: 1_047_576, inputPrice: 0.7, outputPrice: 2.8, cacheReadsPrice: 0.175 },
+		],
 	},
 	"gpt-4.1-nano": {
 		maxTokens: 32_768,
@@ -112,10 +105,9 @@ export const openAiNativeModels = {
 		outputPrice: 0.4,
 		cacheReadsPrice: 0.025,
 		supportsTemperature: true,
-		allowedServiceTiers: ["priority"],
-		serviceTierPricing: {
-			priority: { inputPrice: 0.2, outputPrice: 0.8, cacheReadsPrice: 0.05 },
-		},
+		tiers: [
+			{ name: "priority", contextWindow: 1_047_576, inputPrice: 0.2, outputPrice: 0.8, cacheReadsPrice: 0.05 },
+		],
 	},
 	o3: {
 		maxTokens: 100_000,
@@ -128,11 +120,10 @@ export const openAiNativeModels = {
 		supportsReasoningEffort: true,
 		reasoningEffort: "medium",
 		supportsTemperature: false,
-		allowedServiceTiers: ["flex", "priority"],
-		serviceTierPricing: {
-			flex: { inputPrice: 1.0, outputPrice: 4.0, cacheReadsPrice: 0.25 },
-			priority: { inputPrice: 3.5, outputPrice: 14.0, cacheReadsPrice: 0.875 },
-		},
+		tiers: [
+			{ name: "flex", contextWindow: 200_000, inputPrice: 1.0, outputPrice: 4.0, cacheReadsPrice: 0.25 },
+			{ name: "priority", contextWindow: 200_000, inputPrice: 3.5, outputPrice: 14.0, cacheReadsPrice: 0.875 },
+		],
 	},
 	"o3-high": {
 		maxTokens: 100_000,
@@ -167,11 +158,10 @@ export const openAiNativeModels = {
 		supportsReasoningEffort: true,
 		reasoningEffort: "medium",
 		supportsTemperature: false,
-		allowedServiceTiers: ["flex", "priority"],
-		serviceTierPricing: {
-			flex: { inputPrice: 0.55, outputPrice: 2.2, cacheReadsPrice: 0.138 },
-			priority: { inputPrice: 2.0, outputPrice: 8.0, cacheReadsPrice: 0.5 },
-		},
+		tiers: [
+			{ name: "flex", contextWindow: 200_000, inputPrice: 0.55, outputPrice: 2.2, cacheReadsPrice: 0.138 },
+			{ name: "priority", contextWindow: 200_000, inputPrice: 2.0, outputPrice: 8.0, cacheReadsPrice: 0.5 },
+		],
 	},
 	"o4-mini-high": {
 		maxTokens: 100_000,
@@ -268,10 +258,9 @@ export const openAiNativeModels = {
 		outputPrice: 10,
 		cacheReadsPrice: 1.25,
 		supportsTemperature: true,
-		allowedServiceTiers: ["priority"],
-		serviceTierPricing: {
-			priority: { inputPrice: 4.25, outputPrice: 17.0, cacheReadsPrice: 2.125 },
-		},
+		tiers: [
+			{ name: "priority", contextWindow: 128_000, inputPrice: 4.25, outputPrice: 17.0, cacheReadsPrice: 2.125 },
+		],
 	},
 	"gpt-4o-mini": {
 		maxTokens: 16_384,
@@ -282,10 +271,9 @@ export const openAiNativeModels = {
 		outputPrice: 0.6,
 		cacheReadsPrice: 0.075,
 		supportsTemperature: true,
-		allowedServiceTiers: ["priority"],
-		serviceTierPricing: {
-			priority: { inputPrice: 0.25, outputPrice: 1.0, cacheReadsPrice: 0.125 },
-		},
+		tiers: [
+			{ name: "priority", contextWindow: 128_000, inputPrice: 0.25, outputPrice: 1.0, cacheReadsPrice: 0.125 },
+		],
 	},
 	"codex-mini-latest": {
 		maxTokens: 16_384,