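More progress: resolve reasoning params inside getModelParams (new `format`/`settings` arguments) instead of calling get*Reasoning in each provider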

cte · cte · commit c8a9375e8444 · 2025-05-22T22:40:48.000-07:00
diff --git a/src/api/__tests__/index.test.ts b/src/api/__tests__/index.test.ts
@@ -12,16 +12,20 @@ describe("getModelParams", () => {
 		}
 
 		const result = getModelParams({
-			options: {},
+			format: "openai",
+			settings: {},
 			model,
 			defaultMaxTokens: 1000,
 			defaultTemperature: 0.5,
 		})
 
 		expect(result).toEqual({
+			format: "openai",
 			maxTokens: 1000,
-			thinking: undefined,
 			temperature: 0.5,
+			reasoningEffort: undefined,
+			reasoningBudget: undefined,
+			reasoning: undefined,
 		})
 	})
 
@@ -32,16 +36,20 @@ describe("getModelParams", () => {
 		}
 
 		const result = getModelParams({
-			options: { modelTemperature: 0.7 },
+			format: "openai",
+			settings: { modelTemperature: 0.7 },
 			model,
 			defaultMaxTokens: 1000,
 			defaultTemperature: 0.5,
 		})
 
 		expect(result).toEqual({
+			format: "openai",
 			maxTokens: 1000,
-			thinking: undefined,
 			temperature: 0.7,
+			reasoningEffort: undefined,
+			reasoningBudget: undefined,
+			reasoning: undefined,
 		})
 	})
 
@@ -52,10 +60,13 @@ describe("getModelParams", () => {
 			supportsPromptCache: true,
 		}
 
-		expect(getModelParams({ options: {}, model, defaultMaxTokens: 1000 })).toEqual({
+		expect(getModelParams({ format: "openai", settings: {}, model, defaultMaxTokens: 1000 })).toEqual({
+			format: "openai",
 			maxTokens: 2000,
-			thinking: undefined,
 			temperature: 0,
+			reasoningEffort: undefined,
+			reasoningBudget: undefined,
+			reasoning: undefined,
 		})
 	})
 
@@ -67,10 +78,13 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: {}, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: {}, model })).toEqual({
+			format: "openai",
 			maxTokens: 2000,
-			reasoningBudget: 1600, // 80% of 2000,
 			temperature: 1.0, // Thinking models require temperature 1.0.
+			reasoningEffort: undefined,
+			reasoningBudget: 1600, // 80% of 2000,
+			reasoning: undefined,
 		})
 	})
 
@@ -81,10 +95,15 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: { modelMaxTokens: 3000 }, model, defaultMaxTokens: 2000 })).toEqual({
+		expect(
+			getModelParams({ format: "openai", settings: { modelMaxTokens: 3000 }, model, defaultMaxTokens: 2000 }),
+		).toEqual({
+			format: "openai",
 			maxTokens: 3000,
-			reasoningBudget: 2400, // 80% of 3000,
 			temperature: 1.0,
+			reasoningEffort: undefined,
+			reasoningBudget: 2400, // 80% of 3000,
+			reasoning: undefined,
 		})
 	})
 
@@ -96,10 +115,13 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: { modelMaxThinkingTokens: 1500 }, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: { modelMaxThinkingTokens: 1500 }, model })).toEqual({
+			format: "openai",
 			maxTokens: 4000,
-			reasoningBudget: 1500, // Using the custom value.
 			temperature: 1.0,
+			reasoningEffort: undefined,
+			reasoningBudget: 1500, // Using the custom value.
+			reasoning: undefined,
 		})
 	})
 
@@ -110,11 +132,13 @@ describe("getModelParams", () => {
 			supportsPromptCache: true,
 		}
 
-		expect(getModelParams({ options: { modelMaxThinkingTokens: 1500 }, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: { modelMaxThinkingTokens: 1500 }, model })).toEqual({
+			format: "openai",
 			maxTokens: 4000,
-			reasoningBudget: undefined, // Should remain undefined despite customMaxThinkingTokens being set.
-			reasoningEffort: undefined,
 			temperature: 0, // Using default temperature.
+			reasoningEffort: undefined,
+			reasoningBudget: undefined, // Should remain undefined despite customMaxThinkingTokens being set.
+			reasoning: undefined,
 		})
 	})
 
@@ -126,10 +150,13 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: { modelMaxThinkingTokens: 500 }, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: { modelMaxThinkingTokens: 500 }, model })).toEqual({
+			format: "openai",
 			maxTokens: 2000,
-			reasoningBudget: 1024, // Minimum is 1024
 			temperature: 1.0,
+			reasoningEffort: undefined,
+			reasoningBudget: 1024, // Minimum is 1024
+			reasoning: undefined,
 		})
 	})
 
@@ -141,10 +168,13 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: { modelMaxThinkingTokens: 5000 }, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: { modelMaxThinkingTokens: 5000 }, model })).toEqual({
+			format: "openai",
 			maxTokens: 4000,
-			reasoningBudget: 3200, // 80% of 4000
 			temperature: 1.0,
+			reasoningEffort: undefined,
+			reasoningBudget: 3200, // 80% of 4000
+			reasoning: undefined,
 		})
 	})
 
@@ -155,10 +185,13 @@ describe("getModelParams", () => {
 			supportsReasoningBudget: true,
 		}
 
-		expect(getModelParams({ options: {}, model })).toEqual({
+		expect(getModelParams({ format: "openai", settings: {}, model })).toEqual({
+			format: "openai",
 			maxTokens: undefined,
 			temperature: 1.0,
+			reasoningEffort: undefined,
 			reasoningBudget: Math.floor(ANTHROPIC_DEFAULT_MAX_TOKENS * 0.8),
+			reasoning: undefined,
 		})
 	})
 })
diff --git a/src/api/providers/anthropic-vertex.ts b/src/api/providers/anthropic-vertex.ts
@@ -7,7 +7,6 @@ import { safeJsonParse } from "../../shared/safeJsonParse"
 
 import { ApiStream } from "../transform/stream"
 import { addCacheBreakpoints } from "../transform/caching/vertex"
-import { getAnthropicReasoning } from "../transform/reasoning"
 import { getModelParams } from "../transform/model-params"
 
 import { ANTHROPIC_DEFAULT_MAX_TOKENS } from "./constants"
@@ -57,7 +56,7 @@ export class AnthropicVertexHandler extends BaseProvider implements SingleComple
 			info: { supportsPromptCache },
 			temperature,
 			maxTokens,
-			thinking,
+			reasoning: thinking,
 		} = this.getModel()
 
 		/**
@@ -158,18 +157,17 @@ export class AnthropicVertexHandler extends BaseProvider implements SingleComple
 		const info: ModelInfo = vertexModels[id]
 
 		const params = getModelParams({
-			options: this.options,
+			format: "anthropic",
+			settings: this.options,
 			model: info,
 			defaultMaxTokens: ANTHROPIC_DEFAULT_MAX_TOKENS,
 		})
 
-		const thinking = getAnthropicReasoning({ model: info, params, settings: this.options })
-
 		// The `:thinking` suffix indicates that the model is a "Hybrid"
 		// reasoning model and that reasoning is required to be enabled.
 		// The actual model ID honored by Anthropic's API does not have this
 		// suffix.
-		return { id: id.endsWith(":thinking") ? id.replace(":thinking", "") : id, info, ...params, thinking }
+		return { id: id.endsWith(":thinking") ? id.replace(":thinking", "") : id, info, ...params }
 	}
 
 	async completePrompt(prompt: string) {
@@ -179,7 +177,7 @@ export class AnthropicVertexHandler extends BaseProvider implements SingleComple
 				info: { supportsPromptCache },
 				temperature,
 				maxTokens = ANTHROPIC_DEFAULT_MAX_TOKENS,
-				thinking,
+				reasoning: thinking,
 			} = this.getModel()
 
 			const params: Anthropic.Messages.MessageCreateParamsNonStreaming = {
diff --git a/src/api/providers/anthropic.ts b/src/api/providers/anthropic.ts
@@ -11,7 +11,6 @@ import {
 } from "../../shared/api"
 
 import { ApiStream } from "../transform/stream"
-import { getAnthropicReasoning } from "../transform/reasoning"
 import { getModelParams } from "../transform/model-params"
 
 import { ANTHROPIC_DEFAULT_MAX_TOKENS } from "./constants"
@@ -38,7 +37,7 @@ export class AnthropicHandler extends BaseProvider implements SingleCompletionHa
 	async *createMessage(systemPrompt: string, messages: Anthropic.Messages.MessageParam[]): ApiStream {
 		let stream: AnthropicStream<Anthropic.Messages.RawMessageStreamEvent>
 		const cacheControl: CacheControlEphemeral = { type: "ephemeral" }
-		let { id: modelId, betas = [], maxTokens, temperature, thinking } = this.getModel()
+		let { id: modelId, betas = [], maxTokens, temperature, reasoning: thinking } = this.getModel()
 
 		switch (modelId) {
 			case "claude-sonnet-4-20250514":
@@ -202,13 +201,12 @@ export class AnthropicHandler extends BaseProvider implements SingleCompletionHa
 		const info: ModelInfo = anthropicModels[id]
 
 		const params = getModelParams({
-			options: this.options,
+			format: "anthropic",
+			settings: this.options,
 			model: info,
 			defaultMaxTokens: ANTHROPIC_DEFAULT_MAX_TOKENS,
 		})
 
-		const thinking = getAnthropicReasoning({ model: info, params, settings: this.options })
-
 		// The `:thinking` suffix indicates that the model is a "Hybrid"
 		// reasoning model and that reasoning is required to be enabled.
 		// The actual model ID honored by Anthropic's API does not have this
@@ -218,7 +216,6 @@ export class AnthropicHandler extends BaseProvider implements SingleCompletionHa
 			info,
 			betas: id === "claude-3-7-sonnet-20250219:thinking" ? ["output-128k-2025-02-19"] : undefined,
 			...params,
-			thinking,
 		}
 	}
 
diff --git a/src/api/providers/deepseek.ts b/src/api/providers/deepseek.ts
@@ -3,7 +3,6 @@ import type { ApiHandlerOptions } from "../../shared/api"
 
 import type { ApiStreamUsageChunk } from "../transform/stream"
 import { getModelParams } from "../transform/model-params"
-import { getOpenAiReasoning } from "../transform/reasoning"
 
 import { OpenAiHandler } from "./openai"
 
@@ -22,9 +21,8 @@ export class DeepSeekHandler extends OpenAiHandler {
 	override getModel() {
 		const modelId = this.options.apiModelId ?? deepSeekDefaultModelId
 		const info = deepSeekModels[modelId as keyof typeof deepSeekModels] || deepSeekModels[deepSeekDefaultModelId]
-		const params = getModelParams({ options: this.options, model: info })
-		const reasoning = getOpenAiReasoning({ model: info, params, settings: this.options })
-		return { id: modelId, info, ...params, reasoning }
+		const params = getModelParams({ format: "openai", settings: this.options, model: info })
+		return { id: modelId, info, ...params }
 	}
 
 	// Override to handle DeepSeek's usage metrics, including caching.
diff --git a/src/api/providers/openai-native.ts b/src/api/providers/openai-native.ts
@@ -14,7 +14,6 @@ import { calculateApiCostOpenAI } from "../../utils/cost"
 import { convertToOpenAiMessages } from "../transform/openai-format"
 import { ApiStream } from "../transform/stream"
 import { getModelParams } from "../transform/model-params"
-import { getOpenAiReasoning } from "../transform/reasoning"
 
 import type { SingleCompletionHandler } from "../index"
 import { BaseProvider } from "./base-provider"
@@ -166,23 +165,21 @@ export class OpenAiNativeHandler extends BaseProvider implements SingleCompletio
 
 		const info: ModelInfo = openAiNativeModels[id]
 
-		const params = getModelParams({
-			options: this.options,
+		const { temperature, ...params } = getModelParams({
+			format: "openai",
+			settings: this.options,
 			model: info,
 			defaultTemperature: OPENAI_NATIVE_DEFAULT_TEMPERATURE,
 		})
 
-		const reasoning = getOpenAiReasoning({ model: info, params, settings: this.options })
-
 		// The o3 models are named like "o3-mini-[reasoning-effort]", which are
 		// not valid model ids, so we need to strip the suffix.
 		// Also note that temperature is not supported for o1 and o3-mini.
 		return {
 			id: id.startsWith("o3-mini") ? "o3-mini" : id,
 			info,
 			...params,
-			temperature: id.startsWith("o1") || id.startsWith("o3-mini") ? undefined : params.temperature,
-			reasoning,
+			temperature: id.startsWith("o1") || id.startsWith("o3-mini") ? undefined : temperature,
 		}
 	}
 
diff --git a/src/api/providers/openai.ts b/src/api/providers/openai.ts
@@ -15,7 +15,6 @@ import { convertToOpenAiMessages } from "../transform/openai-format"
 import { convertToR1Format } from "../transform/r1-format"
 import { convertToSimpleMessages } from "../transform/simple-format"
 import { ApiStream, ApiStreamUsageChunk } from "../transform/stream"
-import { getOpenAiReasoning } from "../transform/reasoning"
 import { getModelParams } from "../transform/model-params"
 
 import { DEFAULT_HEADERS, DEEP_SEEK_DEFAULT_TEMPERATURE } from "./constants"
@@ -241,9 +240,8 @@ export class OpenAiHandler extends BaseProvider implements SingleCompletionHandl
 	override getModel() {
 		const id = this.options.openAiModelId ?? ""
 		const info = this.options.openAiCustomModelInfo ?? openAiModelInfoSaneDefaults
-		const params = getModelParams({ options: this.options, model: info })
-		const reasoning = getOpenAiReasoning({ model: info, params, settings: this.options })
-		return { id, info, ...params, reasoning }
+		const params = getModelParams({ format: "openai", settings: this.options, model: info })
+		return { id, info, ...params }
 	}
 
 	async completePrompt(prompt: string): Promise<string> {
diff --git a/src/api/providers/openrouter.ts b/src/api/providers/openrouter.ts
@@ -14,7 +14,7 @@ import { ApiStreamChunk } from "../transform/stream"
 import { convertToR1Format } from "../transform/r1-format"
 import { addCacheBreakpoints as addAnthropicCacheBreakpoints } from "../transform/caching/anthropic"
 import { addCacheBreakpoints as addGeminiCacheBreakpoints } from "../transform/caching/gemini"
-import { type OpenRouterReasoningParams, getOpenRouterReasoning } from "../transform/reasoning"
+import type { OpenRouterReasoningParams } from "../transform/reasoning"
 import { getModelParams } from "../transform/model-params"
 
 import { getModels } from "./fetchers/modelCache"
@@ -189,9 +189,8 @@ export class OpenRouterHandler extends BaseProvider implements SingleCompletionH
 
 		const isDeepSeekR1 = id.startsWith("deepseek/deepseek-r1") || id === "perplexity/sonar-reasoning"
 		const defaultTemperature = isDeepSeekR1 ? DEEP_SEEK_DEFAULT_TEMPERATURE : 0
-		const params = getModelParams({ options: this.options, model: info, defaultTemperature })
-		const reasoning = getOpenRouterReasoning({ model: info, params, settings: this.options })
-		return { id, info, topP: isDeepSeekR1 ? 0.95 : undefined, ...params, reasoning }
+		const params = getModelParams({ format: "openrouter", settings: this.options, model: info, defaultTemperature })
+		return { id, info, topP: isDeepSeekR1 ? 0.95 : undefined, ...params }
 	}
 
 	async completePrompt(prompt: string) {
diff --git a/src/api/providers/xai.ts b/src/api/providers/xai.ts
@@ -5,7 +5,6 @@ import { ApiHandlerOptions, XAIModelId, xaiDefaultModelId, xaiModels } from "../
 
 import { ApiStream } from "../transform/stream"
 import { convertToOpenAiMessages } from "../transform/openai-format"
-import { getOpenAiReasoning } from "../transform/reasoning"
 import { getModelParams } from "../transform/model-params"
 
 import { DEFAULT_HEADERS } from "./constants"
@@ -35,9 +34,8 @@ export class XAIHandler extends BaseProvider implements SingleCompletionHandler
 				: xaiDefaultModelId
 
 		const info = xaiModels[id]
-		const params = getModelParams({ options: this.options, model: info })
-		const reasoning = getOpenAiReasoning({ model: info, params, settings: this.options })
-		return { id, info, ...params, reasoning }
+		const params = getModelParams({ format: "openai", settings: this.options, model: info })
+		return { id, info, ...params }
 	}
 
 	override async *createMessage(systemPrompt: string, messages: Anthropic.Messages.MessageParam[]): ApiStream {
diff --git a/src/api/transform/model-params.ts b/src/api/transform/model-params.ts
diff --git a/src/api/transform/reasoning.ts b/src/api/transform/reasoning.ts