
Commit aeb0731

curl snippets
1 parent a941c0b commit aeb0731

File tree: 3 files changed, 71 additions and 27 deletions

packages/tasks/src/inference-providers.ts
packages/tasks/src/snippets/curl.ts
packages/tasks/src/snippets/js.ts


packages/tasks/src/inference-providers.ts

Lines changed: 1 addition & 1 deletion
@@ -2,7 +2,7 @@ export const INFERENCE_PROVIDERS = ["hf-inference", "fal-ai", "replicate", "samb
 
 export type InferenceProvider = (typeof INFERENCE_PROVIDERS)[number];
 
-const HF_HUB_INFERENCE_PROXY_TEMPLATE = `https://huggingface.co/api/inference-proxy/{{PROVIDER}}`;
+export const HF_HUB_INFERENCE_PROXY_TEMPLATE = `https://huggingface.co/api/inference-proxy/{{PROVIDER}}`;
 
 /**
  * URL to set as baseUrl in the OpenAI SDK.
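The template is now exported so that curl.ts (next file) can substitute a provider name into it when building chat-completion URLs. A minimal sketch of that expansion, using "fal-ai" from the INFERENCE_PROVIDERS list in the hunk header above as the example provider:

import { HF_HUB_INFERENCE_PROXY_TEMPLATE } from "../inference-providers.js";

// Substitute a provider name into the now-exported proxy template,
// the same string replacement curl.ts performs below.
const base = HF_HUB_INFERENCE_PROXY_TEMPLATE.replace("{{PROVIDER}}", "fal-ai");
// base === "https://huggingface.co/api/inference-proxy/fal-ai"
const chatCompletionsUrl = `${base}/v1/chat/completions`;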

packages/tasks/src/snippets/curl.ts

Lines changed: 69 additions & 25 deletions
@@ -1,30 +1,47 @@
-import type { InferenceProvider } from "../inference-providers.js";
+import { HF_HUB_INFERENCE_PROXY_TEMPLATE, type InferenceProvider } from "../inference-providers.js";
 import type { PipelineType } from "../pipelines.js";
 import type { ChatCompletionInputMessage, GenerationParameters } from "../tasks/index.js";
 import { stringifyGenerationConfig, stringifyMessages } from "./common.js";
 import { getModelInputSnippet } from "./inputs.js";
 import type { InferenceSnippet, ModelDataMinimal } from "./types.js";
 
-export const snippetBasic = (model: ModelDataMinimal, accessToken: string): InferenceSnippet => ({
-    content: `curl https://api-inference.huggingface.co/models/${model.id} \\
-    -X POST \\
-    -d '{"inputs": ${getModelInputSnippet(model, true)}}' \\
-    -H 'Content-Type: application/json' \\
-    -H 'Authorization: Bearer ${accessToken || `{API_TOKEN}`}'`,
-});
+export const snippetBasic = (
+    model: ModelDataMinimal,
+    accessToken: string,
+    provider: InferenceProvider
+): InferenceSnippet[] => {
+    if (provider !== "hf-inference") {
+        return [];
+    }
+    return [
+        {
+            content: `curl https://api-inference.huggingface.co/models/${model.id} \\
+    -X POST \\
+    -d '{"inputs": ${getModelInputSnippet(model, true)}}' \\
+    -H 'Content-Type: application/json' \\
+    -H 'Authorization: Bearer ${accessToken || `{API_TOKEN}`}'`,
+        },
+    ];
+};
 
 export const snippetTextGeneration = (
     model: ModelDataMinimal,
     accessToken: string,
+    provider: InferenceProvider,
     opts?: {
         streaming?: boolean;
         messages?: ChatCompletionInputMessage[];
         temperature?: GenerationParameters["temperature"];
         max_tokens?: GenerationParameters["max_tokens"];
         top_p?: GenerationParameters["top_p"];
     }
-): InferenceSnippet => {
+): InferenceSnippet[] => {
     if (model.tags.includes("conversational")) {
+        const baseUrl =
+            provider === "hf-inference"
+                ? `https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions`
+                : HF_HUB_INFERENCE_PROXY_TEMPLATE.replace("{{PROVIDER}}", provider) + "/v1/chat/completions";
+
         // Conversational model detected, so we display a code snippet that features the Messages API
         const streaming = opts?.streaming ?? true;
         const exampleMessages = getModelInputSnippet(model) as ChatCompletionInputMessage[];
@@ -35,8 +52,9 @@ export const snippetTextGeneration = (
         max_tokens: opts?.max_tokens ?? 500,
         ...(opts?.top_p ? { top_p: opts.top_p } : undefined),
     };
-    return {
-        content: `curl 'https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions' \\
+    return [
+        {
+            content: `curl '${baseUrl}' \\
 -H 'Authorization: Bearer ${accessToken || `{API_TOKEN}`}' \\
 -H 'Content-Type: application/json' \\
 --data '{
@@ -53,31 +71,59 @@ export const snippetTextGeneration = (
     })},
     "stream": ${!!streaming}
 }'`,
-    };
+        },
+    ];
     } else {
-        return snippetBasic(model, accessToken);
+        return snippetBasic(model, accessToken, provider);
     }
 };
 
-export const snippetZeroShotClassification = (model: ModelDataMinimal, accessToken: string): InferenceSnippet => ({
-    content: `curl https://api-inference.huggingface.co/models/${model.id} \\
+export const snippetZeroShotClassification = (
+    model: ModelDataMinimal,
+    accessToken: string,
+    provider: InferenceProvider
+): InferenceSnippet[] => {
+    if (provider !== "hf-inference") {
+        return [];
+    }
+    return [
+        {
+            content: `curl https://api-inference.huggingface.co/models/${model.id} \\
     -X POST \\
     -d '{"inputs": ${getModelInputSnippet(model, true)}, "parameters": {"candidate_labels": ["refund", "legal", "faq"]}}' \\
     -H 'Content-Type: application/json' \\
     -H 'Authorization: Bearer ${accessToken || `{API_TOKEN}`}'`,
-});
+        },
+    ];
+};
 
-export const snippetFile = (model: ModelDataMinimal, accessToken: string): InferenceSnippet => ({
-    content: `curl https://api-inference.huggingface.co/models/${model.id} \\
+export const snippetFile = (
+    model: ModelDataMinimal,
+    accessToken: string,
+    provider: InferenceProvider
+): InferenceSnippet[] => {
+    if (provider !== "hf-inference") {
+        return [];
+    }
+    return [
+        {
+            content: `curl https://api-inference.huggingface.co/models/${model.id} \\
     -X POST \\
     --data-binary '@${getModelInputSnippet(model, true, true)}' \\
     -H 'Authorization: Bearer ${accessToken || `{API_TOKEN}`}'`,
-});
+        },
+    ];
+};
 
 export const curlSnippets: Partial<
     Record<
         PipelineType,
-        (model: ModelDataMinimal, accessToken: string, opts?: Record<string, unknown>) => InferenceSnippet
+        (
+            model: ModelDataMinimal,
+            accessToken: string,
+            provider: InferenceProvider,
+            opts?: Record<string, unknown>
+        ) => InferenceSnippet[]
     >
 > = {
     // Same order as in tasks/src/pipelines.ts
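After this refactor, every snippet helper shares the same contract: it returns an array of snippets, and an empty array when the selected provider cannot serve raw curl calls. A minimal sketch of that behavior; the model object and token are placeholders, and ModelDataMinimal is assumed to need only the fields used here:

import { snippetBasic } from "./curl.js";
import type { ModelDataMinimal } from "./types.js";

// Placeholder model; fields beyond these are omitted for illustration.
const model = {
    id: "google-bert/bert-base-uncased",
    pipeline_tag: "fill-mask",
    tags: [],
} as unknown as ModelDataMinimal;

snippetBasic(model, "{API_TOKEN}", "hf-inference"); // -> one curl snippet
snippetBasic(model, "{API_TOKEN}", "fal-ai"); // -> [] (raw curl snippets only target hf-inference)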
@@ -112,11 +158,9 @@ export function getCurlInferenceSnippet(
     provider: InferenceProvider,
     opts?: Record<string, unknown>
 ): InferenceSnippet[] {
-    const snippets =
-        model.pipeline_tag && model.pipeline_tag in curlSnippets
-            ? curlSnippets[model.pipeline_tag]?.(model, accessToken, opts) ?? [{ content: "" }]
-            : [{ content: "" }];
-    return Array.isArray(snippets) ? snippets : [snippets];
+    return model.pipeline_tag && model.pipeline_tag in curlSnippets
+        ? curlSnippets[model.pipeline_tag]?.(model, accessToken, provider, opts) ?? []
+        : [];
 }
 
 export function hasCurlInferenceSnippet(model: Pick<ModelDataMinimal, "pipeline_tag">): boolean {
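A hypothetical end-to-end call of the simplified entry point, assuming a conversational text-generation model (the model id and token are illustrative placeholders; "replicate" comes from the INFERENCE_PROVIDERS list):

import { getCurlInferenceSnippet } from "./curl.js";
import type { ModelDataMinimal } from "./types.js";

// Placeholder conversational model; assumed minimal shape for illustration.
const chatModel = {
    id: "meta-llama/Llama-3.1-8B-Instruct",
    pipeline_tag: "text-generation",
    tags: ["conversational"],
} as unknown as ModelDataMinimal;

const snippets = getCurlInferenceSnippet(chatModel, "{API_TOKEN}", "replicate");
// snippets[0].content begins with:
//   curl 'https://huggingface.co/api/inference-proxy/replicate/v1/chat/completions' ...
// A pipeline_tag with no registered handler now yields [] instead of [{ content: "" }].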

packages/tasks/src/snippets/js.ts

Lines changed: 1 addition & 1 deletion
@@ -1,4 +1,4 @@
-import { HF_HUB_INFERENCE_PROXY_TEMPLATE, openAIbaseUrl, type InferenceProvider } from "../inference-providers.js";
+import { openAIbaseUrl, type InferenceProvider } from "../inference-providers.js";
 import type { PipelineType } from "../pipelines.js";
 import type { ChatCompletionInputMessage, GenerationParameters } from "../tasks/index.js";
 import { stringifyGenerationConfig, stringifyMessages } from "./common.js";
