import { Anthropic } from "@anthropic-ai/sdk"
import OpenAI from "openai"

import {
	heliconeDefaultModelId,
	heliconeDefaultModelInfo,
	heliconeModels,
	DEEP_SEEK_DEFAULT_TEMPERATURE,
} from "@roo-code/types"

import type { ApiHandlerOptions, ModelRecord } from "../../shared/api"

import { convertToOpenAiMessages } from "../transform/openai-format"
import { ApiStreamChunk } from "../transform/stream"
import { convertToR1Format } from "../transform/r1-format"
import { getModelParams } from "../transform/model-params"

import { DEFAULT_HEADERS } from "./constants"
import { BaseProvider } from "./base-provider"
import type { SingleCompletionHandler } from "../index"
import { handleOpenAIError } from "./utils/openai-error-handler"
export class HeliconeHandler extends BaseProvider implements SingleCompletionHandler {
	protected options: ApiHandlerOptions
	private client: OpenAI
	protected models: ModelRecord = {}
	private readonly providerName = "Helicone"

	constructor(options: ApiHandlerOptions) {
		super()
		this.options = options

		const baseURL = this.options.heliconeBaseUrl || "https://ai-gateway.helicone.ai/v1"
		const apiKey = this.options.heliconeApiKey ?? "not-provided"

		this.client = new OpenAI({ baseURL, apiKey, defaultHeaders: DEFAULT_HEADERS })
	}

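	/**
	 * Streams a chat completion: converts the Anthropic-style messages to
	 * OpenAI format, applies reasoning-model adjustments, and yields text,
	 * reasoning, and usage chunks as they arrive.
	 */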
	override async *createMessage(
		systemPrompt: string,
		messages: Anthropic.Messages.MessageParam[],
	): AsyncGenerator<ApiStreamChunk> {
		const model = await this.fetchModel()

		let { id: modelId, maxTokens, temperature } = model

		// Convert Anthropic messages to OpenAI format.
		let openAiMessages: OpenAI.Chat.ChatCompletionMessageParam[] = [
			{ role: "system", content: systemPrompt },
			...convertToOpenAiMessages(messages),
		]

		// DeepSeek-R1 and similar reasoning models recommend passing the system
		// prompt as a user message rather than using the system role.
		if (this.isDeepSeekR1(modelId) || this.isPerplexityReasoning(modelId)) {
			openAiMessages = convertToR1Format([{ role: "user", content: systemPrompt }, ...messages])
			// Fall back to the DeepSeek-recommended default temperature.
			temperature = this.options.modelTemperature ?? DEEP_SEEK_DEFAULT_TEMPERATURE
		}

		// TODO [HELICONE]: add automatic gemini/anthropic cache breakpoints

		const completionParams: OpenAI.Chat.Completions.ChatCompletionCreateParamsStreaming = {
			model: modelId,
			...(maxTokens && maxTokens > 0 && { max_tokens: maxTokens }),
			temperature,
			messages: openAiMessages,
			stream: true,
			stream_options: { include_usage: true },
		}

		let stream
		try {
			stream = await this.client.chat.completions.create(completionParams)
		} catch (error) {
			throw handleOpenAIError(error, this.providerName)
		}

		let lastUsage: OpenAI.CompletionUsage | undefined

		for await (const chunk of stream) {
			const delta = chunk.choices[0]?.delta

			// Some gateway models surface reasoning tokens on a non-standard
			// `reasoning` delta field that the OpenAI types do not declare.
			if (
				delta &&
				"reasoning" in delta &&
				typeof (delta as any).reasoning === "string" &&
				(delta as any).reasoning
			) {
				yield { type: "reasoning", text: (delta as any).reasoning as string }
			}

			if (delta?.content) {
				yield { type: "text", text: delta.content }
			}

			if (chunk.usage) {
				lastUsage = chunk.usage
			}
		}

		if (lastUsage) {
			yield {
				type: "usage",
				inputTokens: lastUsage.prompt_tokens || 0,
				outputTokens: lastUsage.completion_tokens || 0,
				cacheReadTokens: lastUsage.prompt_tokens_details?.cached_tokens,
				reasoningTokens: lastUsage.completion_tokens_details?.reasoning_tokens,
			}
		}
	}

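	/**
	 * Refreshes the static Helicone model table, then resolves the model for
	 * the current options.
	 */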
	public async fetchModel() {
		this.models = heliconeModels as unknown as ModelRecord
		return this.getModel()
	}

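	/**
	 * Resolves the configured model id (falling back to the Helicone default)
	 * and derives request parameters from the model info and user settings.
	 */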
	override getModel() {
		const id = this.options.apiModelId ?? heliconeDefaultModelId
		const info = this.models[id] ?? heliconeDefaultModelInfo

		const params = getModelParams({
			format: "openai",
			modelId: id,
			model: info,
			settings: this.options,
			defaultTemperature:
				this.isDeepSeekR1(id) || this.isPerplexityReasoning(id) ? DEEP_SEEK_DEFAULT_TEMPERATURE : 0,
		})

		// Apply a small top_p tweak for DeepSeek-style reasoning models.
		const topP = this.isDeepSeekR1(id) || this.isPerplexityReasoning(id) ? 0.95 : undefined
		return { id, info, topP, ...params }
	}

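	/**
	 * Non-streaming, single-shot completion for SingleCompletionHandler.
	 */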
	async completePrompt(prompt: string) {
		const { id: modelId, maxTokens, temperature } = await this.fetchModel()

		const completionParams: OpenAI.Chat.Completions.ChatCompletionCreateParamsNonStreaming = {
			model: modelId,
			...(maxTokens && maxTokens > 0 && { max_tokens: maxTokens }),
			temperature,
			messages: [{ role: "user", content: prompt }],
			stream: false,
		}

		let response
		try {
			response = await this.client.chat.completions.create(completionParams)
		} catch (error) {
			throw handleOpenAIError(error, this.providerName)
		}

		// Some gateway failures arrive as a 200 response carrying an `error`
		// body rather than a thrown exception.
		if ("error" in (response as any)) {
			const error = (response as any).error as { message?: string; code?: number }
			throw new Error(`Helicone API Error ${error?.code}: ${error?.message}`)
		}

		const completion = response as OpenAI.Chat.ChatCompletion
		return completion.choices[0]?.message?.content || ""
	}

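	// Model-id heuristics used for the reasoning-model special cases above.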
	private isDeepSeekR1(modelId: string): boolean {
		return modelId.includes("deepseek-r1")
	}

	private isPerplexityReasoning(modelId: string): boolean {
		return modelId.includes("sonar-reasoning")
	}
}
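
// Usage sketch (illustrative only; the option values below are assumptions,
// not a complete ApiHandlerOptions):
//
//   const handler = new HeliconeHandler({ heliconeApiKey: process.env.HELICONE_API_KEY })
//   for await (const chunk of handler.createMessage(systemPrompt, anthropicMessages)) {
//       if (chunk.type === "text") process.stdout.write(chunk.text)
//   }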