
Commit 8aafe25

openai client compat
1 parent 7184d1b commit 8aafe25

4 files changed: +40 −35 lines

packages/tasks/src/inference-providers.ts

Lines changed: 2 additions & 0 deletions

@@ -1,3 +1,5 @@
 export const INFERENCE_PROVIDERS = ["hf-inference", "fal-ai", "replicate", "sambanova", "together"] as const;
 
 export type InferenceProvider = (typeof INFERENCE_PROVIDERS)[number];
+
+export const HF_HUB_INFERENCE_PROXY_TEMPLATE = `https://huggingface.co/api/inference-proxy/{{PROVIDER}}`;
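
The template is resolved with a plain string replace on the {{PROVIDER}} placeholder, exactly as done in js.ts below. A minimal sketch of that resolution (the provider value and import path are illustrative):

import { HF_HUB_INFERENCE_PROXY_TEMPLATE, type InferenceProvider } from "./inference-providers.js";

// Any provider other than "hf-inference" is routed through the Hub proxy.
const provider: InferenceProvider = "together";
const baseUrl = HF_HUB_INFERENCE_PROXY_TEMPLATE.replace("{{PROVIDER}}", provider);
// baseUrl === "https://huggingface.co/api/inference-proxy/together"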

packages/tasks/src/snippets/curl.ts

Lines changed: 9 additions & 5 deletions

@@ -1,3 +1,4 @@
+import type { InferenceProvider } from "../inference-providers.js";
 import type { PipelineType } from "../pipelines.js";
 import type { ChatCompletionInputMessage, GenerationParameters } from "../tasks/index.js";
 import { stringifyGenerationConfig, stringifyMessages } from "./common.js";
@@ -79,7 +80,7 @@ export const curlSnippets: Partial<
         (model: ModelDataMinimal, accessToken: string, opts?: Record<string, unknown>) => InferenceSnippet
     >
 > = {
-    // Same order as in js/src/lib/interfaces/Types.ts
+    // Same order as in tasks/src/pipelines.ts
     "text-classification": snippetBasic,
     "token-classification": snippetBasic,
    "table-question-answering": snippetBasic,
@@ -108,11 +109,14 @@ export const curlSnippets: Partial<
 export function getCurlInferenceSnippet(
     model: ModelDataMinimal,
     accessToken: string,
+    provider: InferenceProvider,
     opts?: Record<string, unknown>
-): InferenceSnippet {
-    return model.pipeline_tag && model.pipeline_tag in curlSnippets
-        ? curlSnippets[model.pipeline_tag]?.(model, accessToken, opts) ?? { content: "" }
-        : { content: "" };
+): InferenceSnippet[] {
+    const snippets =
+        model.pipeline_tag && model.pipeline_tag in curlSnippets
+            ? curlSnippets[model.pipeline_tag]?.(model, accessToken, opts) ?? [{ content: "" }]
+            : [{ content: "" }];
+    return Array.isArray(snippets) ? snippets : [snippets];
 }
 
 export function hasCurlInferenceSnippet(model: Pick<ModelDataMinimal, "pipeline_tag">): boolean {
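
With the new signature, callers pass a provider and always get an InferenceSnippet[] back, so they can iterate without special-casing a single snippet. A hedged usage sketch (the model literal and import paths are hypothetical; real callers pass ModelDataMinimal data fetched from the Hub):

import { getCurlInferenceSnippet } from "./curl.js";
import type { ModelDataMinimal } from "./types.js"; // assumed location of ModelDataMinimal

// Hypothetical minimal model data, for illustration only.
const model = {
    id: "my-org/my-model",
    pipeline_tag: "text-classification",
    tags: [],
} as ModelDataMinimal;

for (const snippet of getCurlInferenceSnippet(model, "hf_***", "hf-inference")) {
    console.log(snippet.content);
}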

packages/tasks/src/snippets/js.ts

Lines changed: 24 additions & 27 deletions

@@ -1,4 +1,4 @@
-import type { InferenceProvider } from "../inference-providers.js";
+import { HF_HUB_INFERENCE_PROXY_TEMPLATE, type InferenceProvider } from "../inference-providers.js";
 import type { PipelineType } from "../pipelines.js";
 import type { ChatCompletionInputMessage, GenerationParameters } from "../tasks/index.js";
 import { stringifyGenerationConfig, stringifyMessages } from "./common.js";
@@ -51,6 +51,11 @@ export const snippetTextGeneration = (
         top_p?: GenerationParameters["top_p"];
     }
 ): InferenceSnippet[] => {
+    const openAIbaseUrl =
+        provider === "hf-inference"
+            ? "https://api-inference.huggingface.co/v1/"
+            : HF_HUB_INFERENCE_PROXY_TEMPLATE.replace("{{PROVIDER}}", provider);
+
     if (model.tags.includes("conversational")) {
         // Conversational model detected, so we display a code snippet that features the Messages API
         const streaming = opts?.streaming ?? true;
@@ -93,15 +98,13 @@ for await (const chunk of stream) {
     }
 }`,
         },
-        ...(provider === "hf-inference"
-            ? [
-                {
-                    client: "openai",
-                    content: `import { OpenAI } from "openai";
+        {
+            client: "openai",
+            content: `import { OpenAI } from "openai";
 
 const client = new OpenAI({
-    baseURL: "https://api-inference.huggingface.co/v1/",
-    apiKey: "${accessToken || `{API_TOKEN}`}"
+    baseURL: "${openAIbaseUrl}",
+    apiKey: "${accessToken || `{API_TOKEN}`}"
 });
 
 let out = "";
@@ -120,9 +123,7 @@ for await (const chunk of stream) {
         console.log(newContent);
     }
 }`,
-                },
-            ]
-            : []),
+        },
     ];
 } else {
     return [
@@ -141,15 +142,13 @@ const chatCompletion = await client.chatCompletion({
 
 console.log(chatCompletion.choices[0].message);`,
         },
-        ...(provider === "hf-inference"
-            ? [
-                {
-                    client: "openai",
-                    content: `import { OpenAI } from "openai";
+        {
+            client: "openai",
+            content: `import { OpenAI } from "openai";
 
 const client = new OpenAI({
-    baseURL: "https://api-inference.huggingface.co/v1/",
-    apiKey: "${accessToken || `{API_TOKEN}`}"
+    baseURL: "${openAIbaseUrl}",
+    apiKey: "${accessToken || `{API_TOKEN}`}"
 });
 
 const chatCompletion = await client.chat.completions.create({
@@ -159,9 +158,7 @@ const chatCompletion = await client.chat.completions.create({
 });
 
 console.log(chatCompletion.choices[0].message);`,
-                },
-            ]
-            : []),
+        },
     ];
 }
 } else {
@@ -227,9 +224,9 @@ infer(${getModelInputSnippet(model)}, { num_inference_steps: 5 }).then((image) =
         },
         ...(provider === "hf-inference"
             ? [
-                    {
-                        client: "fetch",
-                        content: `async function query(data) {
+                {
+                    client: "fetch",
+                    content: `async function query(data) {
     const response = await fetch(
         "https://api-inference.huggingface.co/models/${model.id}",
         {
@@ -247,8 +244,8 @@ infer(${getModelInputSnippet(model)}, { num_inference_steps: 5 }).then((image) =
 query({"inputs": ${getModelInputSnippet(model)}}).then((response) => {
     // Use image
 });`,
-                    },
-                ]
+                },
+            ]
             : []),
     ];
 };
@@ -385,7 +382,7 @@ export const jsSnippets: Partial<
     ) => InferenceSnippet[]
 >
 > = {
-    // Same order as in src/pipelines.ts
+    // Same order as in tasks/src/pipelines.ts
     "text-classification": snippetBasic,
     "token-classification": snippetBasic,
    "table-question-answering": snippetBasic,

packages/tasks/src/snippets/python.ts

Lines changed: 5 additions & 3 deletions

@@ -1,3 +1,4 @@
+import type { InferenceProvider } from "../inference-providers.js";
 import type { PipelineType } from "../pipelines.js";
 import type { ChatCompletionInputMessage, GenerationParameters } from "../tasks/index.js";
 import { stringifyGenerationConfig, stringifyMessages } from "./common.js";
@@ -287,16 +288,17 @@ export const pythonSnippets: Partial<
 export function getPythonInferenceSnippet(
     model: ModelDataMinimal,
     accessToken: string,
+    provider: InferenceProvider,
     opts?: Record<string, unknown>
-): InferenceSnippet | InferenceSnippet[] {
+): InferenceSnippet[] {
     if (model.tags.includes("conversational")) {
         // Conversational model detected, so we display a code snippet that features the Messages API
         return snippetConversational(model, accessToken, opts);
     } else {
         let snippets =
             model.pipeline_tag && model.pipeline_tag in pythonSnippets
-                ? pythonSnippets[model.pipeline_tag]?.(model, accessToken) ?? { content: "" }
-                : { content: "" };
+                ? pythonSnippets[model.pipeline_tag]?.(model, accessToken) ?? [{ content: "" }]
+                : [{ content: "" }];
 
         snippets = Array.isArray(snippets) ? snippets : [snippets];
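
getPythonInferenceSnippet mirrors the curl change: provider is threaded through and the return type is normalized to InferenceSnippet[] (the hunk shown ends before the parameter is used). A consumer sketch under the same hypothetical-model caveat as the curl example above:

import { getPythonInferenceSnippet } from "./python.js";
import type { ModelDataMinimal } from "./types.js"; // assumed location, as above

// Hypothetical non-conversational model, assuming its task has a Python snippet.
const model = {
    id: "my-org/my-classifier",
    pipeline_tag: "text-classification",
    tags: [],
} as ModelDataMinimal;

const [first] = getPythonInferenceSnippet(model, "hf_***", "hf-inference");
console.log(first.content);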
