2 changes: 1 addition & 1 deletion README.md
@@ -35,7 +35,7 @@
- [简体中文](locales/zh-CN/README.md)
- [繁體中文](locales/zh-TW/README.md)
- ...
</details>
</details>

---

2 changes: 1 addition & 1 deletion locales/ca/README.md

2 changes: 1 addition & 1 deletion locales/de/README.md
2 changes: 1 addition & 1 deletion locales/es/README.md
2 changes: 1 addition & 1 deletion locales/fr/README.md
2 changes: 1 addition & 1 deletion locales/hi/README.md
2 changes: 1 addition & 1 deletion locales/id/README.md
2 changes: 1 addition & 1 deletion locales/it/README.md
2 changes: 1 addition & 1 deletion locales/ja/README.md
2 changes: 1 addition & 1 deletion locales/ko/README.md
2 changes: 1 addition & 1 deletion locales/nl/README.md
2 changes: 1 addition & 1 deletion locales/pl/README.md
2 changes: 1 addition & 1 deletion locales/pt-BR/README.md
2 changes: 1 addition & 1 deletion locales/ru/README.md
2 changes: 1 addition & 1 deletion locales/tr/README.md
2 changes: 1 addition & 1 deletion locales/vi/README.md
2 changes: 1 addition & 1 deletion locales/zh-CN/README.md
2 changes: 1 addition & 1 deletion locales/zh-TW/README.md

54 changes: 46 additions & 8 deletions src/api/providers/__tests__/io-intelligence.spec.ts
@@ -58,6 +58,42 @@ vi.mock("../fetchers/io-intelligence", () => ({
})),
}))

// Mock the model cache
vi.mock("../fetchers/modelCache", () => ({
getModels: vi.fn().mockImplementation(() => {
return Promise.resolve({
"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": {
maxTokens: 8192,
contextWindow: 430000,
description: "Llama 4 Maverick 17B model",
supportsImages: true,
supportsPromptCache: false,
},
"deepseek-ai/DeepSeek-R1-0528": {
maxTokens: 8192,
contextWindow: 128000,
supportsImages: false,
supportsPromptCache: false,
description: "DeepSeek R1 reasoning model",
},
"Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar": {
maxTokens: 4096,
contextWindow: 106000,
supportsImages: false,
supportsPromptCache: false,
description: "Qwen3 Coder 480B specialized for coding",
},
"openai/gpt-oss-120b": {
maxTokens: 8192,
contextWindow: 131072,
supportsImages: false,
supportsPromptCache: false,
description: "OpenAI GPT-OSS 120B model",
},
})
}),
}))
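With this mock in place, any call to the shared model cache resolves to the four records above, so tests can assert against them directly. A minimal sketch of that, not part of this PR — the argument shape passed to getModels is an assumption here:

```typescript
// Illustrative only — not part of this PR. The mock makes getModels resolve to
// the four records above regardless of its arguments (argument shape assumed).
it("exposes the mocked IO Intelligence models", async () => {
	const { getModels } = await import("../fetchers/modelCache")
	const models = await getModels({ provider: "io-intelligence" } as any)
	expect(models["meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"].contextWindow).toBe(430000)
	expect(models["deepseek-ai/DeepSeek-R1-0528"].supportsImages).toBe(false)
})
```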

// Mock constants
vi.mock("../constants", () => ({
DEFAULT_HEADERS: { "User-Agent": "roo-cline" },
@@ -72,11 +72,11 @@ describe("IOIntelligenceHandler", () => {
let handler: IOIntelligenceHandler
let mockOptions: ApiHandlerOptions

beforeEach(() => {
beforeEach(async () => {
vi.clearAllMocks()
mockOptions = {
ioIntelligenceApiKey: "test-api-key",
apiModelId: "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
ioIntelligenceModelId: "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
modelTemperature: 0.7,
includeMaxTokens: false,
modelMaxTokens: undefined,
@@ -129,17 +165,19 @@ it("should initialize with correct configuration", () => {
it("should initialize with correct configuration", () => {
expect(handler).toBeInstanceOf(IOIntelligenceHandler)
expect(handler["client"]).toBeDefined()
expect(handler["options"]).toEqual({
...mockOptions,
apiKey: mockOptions.ioIntelligenceApiKey,
})
expect(handler["options"]).toEqual(mockOptions)
})

it("should throw error when API key is missing", () => {
it("should allow handler creation without API key for model fetching", () => {
const optionsWithoutKey = { ...mockOptions }
delete optionsWithoutKey.ioIntelligenceApiKey

expect(() => new IOIntelligenceHandler(optionsWithoutKey)).toThrow("IO Intelligence API key is required")
// Handler can be created without API key (validation happens at UI level)
const handlerWithoutKey = new IOIntelligenceHandler(optionsWithoutKey)
expect(handlerWithoutKey).toBeInstanceOf(IOIntelligenceHandler)
expect(handlerWithoutKey["client"]).toBeDefined()
// Client should have a placeholder API key
expect(handlerWithoutKey["client"].apiKey).toBe("not-provided")
})

it("should handle streaming response correctly", async () => {
54 changes: 24 additions & 30 deletions src/api/providers/fetchers/io-intelligence.ts
@@ -1,9 +1,8 @@
import axios from "axios"
import { z } from "zod"

import { type ModelInfo, IO_INTELLIGENCE_CACHE_DURATION } from "@roo-code/types"

import type { ModelRecord } from "../../../shared/api"
import { parseApiPrice } from "../../../shared/cost"

const ioIntelligenceModelSchema = z.object({
id: z.string(),
@@ -29,6 +28,15 @@ const ioIntelligenceModelSchema = z.object({
is_blocking: z.boolean(),
}),
),
max_tokens: z.number().nullable().optional(),
context_window: z.number().optional(),
supports_images_input: z.boolean().optional().default(false),
supports_prompt_cache: z.boolean().optional().default(false),
input_token_price: z.number().nullable().optional(),
output_token_price: z.number().nullable().optional(),
cache_write_token_price: z.number().nullable().optional(),
cache_read_token_price: z.number().nullable().optional(),
precision: z.string().nullable().optional(),
})

export type IOIntelligenceModel = z.infer<typeof ioIntelligenceModelSchema>
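The newly added fields are all optional, with the two boolean flags defaulting to false when absent. A small illustrative fragment of how a models-endpoint record could populate them — the values are invented and the schema's pre-existing required fields (id and the rest) are omitted:

```typescript
// Illustrative fragment only — values invented; required pre-existing schema
// fields (id, etc.) are omitted here.
const newOptionalFields = {
	max_tokens: 8192, // nullable + optional; null or absent falls back to the 20% rule in the parser below
	context_window: 131072,
	supports_images_input: false, // optional, defaults to false when absent
	supports_prompt_cache: false, // optional, defaults to false when absent
	input_token_price: null, // nullable + optional; run through parseApiPrice
	output_token_price: null,
	precision: "fp8", // nullable + optional
}
```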
@@ -47,34 +55,21 @@ interface CacheEntry {

let cache: CacheEntry | null = null

/**
* Model context length mapping based on the documentation
* <mcreference link="https://docs.io.net/reference/get-started-with-io-intelligence-api" index="1">1</mcreference>
*/
const MODEL_CONTEXT_LENGTHS: Record<string, number> = {
"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": 430000,
"deepseek-ai/DeepSeek-R1-0528": 128000,
"Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar": 106000,
"openai/gpt-oss-120b": 131072,
}

const VISION_MODELS = new Set([
"Qwen/Qwen2.5-VL-32B-Instruct",
"meta-llama/Llama-3.2-90B-Vision-Instruct",
"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
])

function parseIOIntelligenceModel(model: IOIntelligenceModel): ModelInfo {
const contextLength = MODEL_CONTEXT_LENGTHS[model.id] || 8192
// Cap maxTokens at 32k for very large context windows, or 20% of context length, whichever is smaller.
const maxTokens = Math.min(contextLength, Math.ceil(contextLength * 0.2), 32768)
const supportsImages = VISION_MODELS.has(model.id)
const contextWindow = model.context_window ?? model.max_model_len ?? 8192

// Use API max_tokens if provided, otherwise calculate 20% of context window
const maxTokens = model.max_tokens && model.max_tokens > 0 ? model.max_tokens : Math.ceil(contextWindow * 0.2)

return {
maxTokens,
contextWindow: contextLength,
supportsImages,
supportsPromptCache: false,
contextWindow,
supportsImages: model.supports_images_input,
supportsPromptCache: model.supports_prompt_cache,
inputPrice: parseApiPrice(model.input_token_price),
outputPrice: parseApiPrice(model.output_token_price),
cacheWritesPrice: parseApiPrice(model.cache_write_token_price),
cacheReadsPrice: parseApiPrice(model.cache_read_token_price),
description: `${model.id} via IO Intelligence`,
}
}
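To make the fallback above concrete, here is a short sketch of the arithmetic — the values are illustrative, not taken from this PR:

```typescript
// Illustrative values only. A record reporting context_window = 430000 with no
// max_tokens would be parsed as:
const contextWindow = 430_000
const maxTokens = Math.ceil(contextWindow * 0.2) // 86_000
// A record that does report a positive max_tokens (e.g. 8192) keeps it as-is.
```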
@@ -97,18 +92,17 @@ export async function getIOIntelligenceModels(apiKey?: string): Promise<ModelRec
"Content-Type": "application/json",
}

// Note: IO Intelligence models endpoint does not require authentication
// API key is optional for future use if needed
if (apiKey) {
headers.Authorization = `Bearer ${apiKey}`
} else {
console.error("IO Intelligence API key is required")
throw new Error("IO Intelligence API key is required")
}

const response = await axios.get<IOIntelligenceApiResponse>(
"https://api.intelligence.io.solutions/api/v1/models",
{
headers,
timeout: 10_000,
timeout: 10000,
},
)
