
Commit d084ae2

SBrandeis authored and aykutkardas committed
[Inference] [Providers] Enforce task in mapping + expose them (huggingface#1109)
- Add task metadata to the HF id -> Provider id mappings, to forbid, for example, using a chat model with the `textToImage` inference function
- Expose the supported models mappings in `index.ts`
1 parent fbd01bc commit d084ae2
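
To summarize the shape change the commit message describes, here is an illustrative sketch (simplified types, not code taken from the diff); the real mappings and diffs follow below.

```ts
// Illustrative only: simplified before/after shape of a provider mapping entry.
// Before: a flat HF model id -> provider id record, with no notion of task.
const before: Record<string, string> = {
	"black-forest-labs/FLUX.1-schnell": "fal-ai/flux/schnell",
};

// After: keyed by task first, so a model registered only under "conversational"
// can never be resolved for a "text-to-image" request.
const after: Partial<Record<string, Record<string, string>>> = {
	"text-to-image": {
		"black-forest-labs/FLUX.1-schnell": "fal-ai/flux/schnell",
	},
};

console.log(before["black-forest-labs/FLUX.1-schnell"]); // "fal-ai/flux/schnell"
console.log(after["text-to-image"]?.["black-forest-labs/FLUX.1-schnell"]); // "fal-ai/flux/schnell"
```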

File tree

8 files changed, +200 -173 lines changed


packages/inference/src/index.ts

Lines changed: 4 additions & 0 deletions
@@ -1,4 +1,8 @@
 export { HfInference, HfInferenceEndpoint } from "./HfInference";
 export { InferenceOutputError } from "./lib/InferenceOutputError";
+export { FAL_AI_SUPPORTED_MODEL_IDS } from "./providers/fal-ai";
+export { REPLICATE_SUPPORTED_MODEL_IDS } from "./providers/replicate";
+export { SAMBANOVA_SUPPORTED_MODEL_IDS } from "./providers/sambanova";
+export { TOGETHER_SUPPORTED_MODEL_IDS } from "./providers/together";
 export * from "./types";
 export * from "./tasks";
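
Because the mappings are now re-exported from the package entry point, consumers can inspect provider coverage directly. A minimal sketch, assuming the package is consumed under its npm name `@huggingface/inference` and using the task-first structure shown in the provider diffs below:

```ts
import { FAL_AI_SUPPORTED_MODEL_IDS } from "@huggingface/inference"; // assumed package name

// Look up the fal.ai app id for an HF model, scoped to a task.
const falId = FAL_AI_SUPPORTED_MODEL_IDS["text-to-image"]?.["black-forest-labs/FLUX.1-schnell"];
console.log(falId); // "fal-ai/flux/schnell" according to the fal-ai mapping in this commit
```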

packages/inference/src/lib/makeRequestOptions.ts

Lines changed: 24 additions & 14 deletions
@@ -1,8 +1,8 @@
 import { HF_HUB_URL, HF_INFERENCE_API_URL } from "../config";
-import { FAL_AI_API_BASE_URL, FAL_AI_MODEL_IDS } from "../providers/fal-ai";
-import { REPLICATE_API_BASE_URL, REPLICATE_MODEL_IDS } from "../providers/replicate";
-import { SAMBANOVA_API_BASE_URL, SAMBANOVA_MODEL_IDS } from "../providers/sambanova";
-import { TOGETHER_API_BASE_URL, TOGETHER_MODEL_IDS } from "../providers/together";
+import { FAL_AI_API_BASE_URL, FAL_AI_SUPPORTED_MODEL_IDS } from "../providers/fal-ai";
+import { REPLICATE_API_BASE_URL, REPLICATE_SUPPORTED_MODEL_IDS } from "../providers/replicate";
+import { SAMBANOVA_API_BASE_URL, SAMBANOVA_SUPPORTED_MODEL_IDS } from "../providers/sambanova";
+import { TOGETHER_API_BASE_URL, TOGETHER_SUPPORTED_MODEL_IDS } from "../providers/together";
 import type { InferenceProvider } from "../types";
 import type { InferenceTask, Options, RequestArgs } from "../types";
 import { isUrl } from "./isUrl";

@@ -50,13 +50,13 @@ export async function makeRequestOptions(
 	let model: string;
 	if (!maybeModel) {
 		if (taskHint) {
-			model = mapModel({ model: await loadDefaultModel(taskHint), provider });
+			model = mapModel({ model: await loadDefaultModel(taskHint), provider, taskHint, chatCompletion });
 		} else {
 			throw new Error("No model provided, and no default model found for this task");
 			/// TODO : change error message ^
 		}
 	} else {
-		model = mapModel({ model: maybeModel, provider });
+		model = mapModel({ model: maybeModel, provider, taskHint, chatCompletion });
 	}

 	/// If accessToken is passed, it should take precedence over includeCredentials

@@ -143,24 +143,34 @@
 	return { url, info };
 }

-function mapModel(params: { model: string; provider: InferenceProvider }): string {
+function mapModel(params: {
+	model: string;
+	provider: InferenceProvider;
+	taskHint: InferenceTask | undefined;
+	chatCompletion: boolean | undefined;
+}): string {
+	if (params.provider === "hf-inference") {
+		return params.model;
+	}
+	if (!params.taskHint) {
+		throw new Error("taskHint must be specified when using a third-party provider");
+	}
+	const task = params.taskHint === "text-generation" && params.chatCompletion ? "conversational" : params.taskHint;
 	const model = (() => {
 		switch (params.provider) {
 			case "fal-ai":
-				return FAL_AI_MODEL_IDS[params.model];
+				return FAL_AI_SUPPORTED_MODEL_IDS[task]?.[params.model];
 			case "replicate":
-				return REPLICATE_MODEL_IDS[params.model];
+				return REPLICATE_SUPPORTED_MODEL_IDS[task]?.[params.model];
 			case "sambanova":
-				return SAMBANOVA_MODEL_IDS[params.model];
+				return SAMBANOVA_SUPPORTED_MODEL_IDS[task]?.[params.model];
 			case "together":
-				return TOGETHER_MODEL_IDS[params.model]?.id;
-			case "hf-inference":
-				return params.model;
+				return TOGETHER_SUPPORTED_MODEL_IDS[task]?.[params.model];
 		}
 	})();

 	if (!model) {
-		throw new Error(`Model ${params.model} is not supported for provider ${params.provider}`);
+		throw new Error(`Model ${params.model} is not supported for task ${task} and provider ${params.provider}`);
 	}
 	return model;
 }
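
The task-resolution rule that `mapModel` now applies can be shown in isolation. This is a standalone sketch of the logic above, not an exported helper of the library:

```ts
// Standalone sketch of the rule added to mapModel (simplified types).
type Task = string;

function resolveTask(taskHint: Task | undefined, chatCompletion: boolean | undefined): Task {
	if (!taskHint) {
		// Third-party providers need a task to select the right sub-mapping.
		throw new Error("taskHint must be specified when using a third-party provider");
	}
	// A text-generation request issued through the chat-completion API is looked up
	// under the "conversational" key of the provider mapping.
	return taskHint === "text-generation" && chatCompletion ? "conversational" : taskHint;
}

console.log(resolveTask("text-generation", true)); // "conversational"
console.log(resolveTask("text-to-image", undefined)); // "text-to-image"
```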

packages/inference/src/providers/fal-ai.ts

Lines changed: 70 additions & 70 deletions
@@ -1,76 +1,76 @@
-import type { ModelId } from "../types";
+import { ModelId } from "../types";
+import type { ProviderMapping } from "./types";

 export const FAL_AI_API_BASE_URL = "https://fal.run";

 type FalAiId = string;

-/**
- * Mapping from HF model ID -> fal.ai app id
- */
-export const FAL_AI_MODEL_IDS: Record<ModelId, FalAiId> = {
-	/** text-to-image */
-	"black-forest-labs/FLUX.1-schnell": "fal-ai/flux/schnell",
-	"black-forest-labs/FLUX.1-dev": "fal-ai/flux/dev",
-	"black-forest-labs/FLUX.1-Depth-dev": "fal-ai/flux-lora-depth",
-	"black-forest-labs/FLUX.1-Canny-dev": "fal-ai/flux-lora-canny",
-	"black-forest-labs/FLUX.1-Redux-dev": "fal-ai/flux/dev/redux",
-	"playgroundai/playground-v2.5-1024px-aesthetic": "fal-ai/playground-v25",
-	"ByteDance/SDXL-Lightning": "fal-ai/lightning-models",
-	"PixArt-alpha/PixArt-Sigma-XL-2-1024-MS": "fal-ai/pixart-sigma",
-	"stabilityai/stable-diffusion-3-medium": "fal-ai/stable-diffusion-v3-medium",
-	"Warlord-K/Sana-1024": "fal-ai/sana",
-	"fal/AuraFlow-v0.2": "fal-ai/aura-flow",
-	"stabilityai/stable-diffusion-3.5-large": "fal-ai/stable-diffusion-v35-large",
-	"yresearch/Switti": "fal-ai/switti",
-	"guozinan/PuLID": "fal-ai/flux-pulid",
-	"lllyasviel/ic-light": "fal-ai/iclight-v2",
-	"stabilityai/stable-diffusion-xl-base-1.0": "fal-ai/lora",
-	"Kwai-Kolors/Kolors": "fal-ai/kolors",
-
-	/** image-to-image */
-	"Yuanshi/OminiControl": "fal-ai/flux-subject",
-	"fal/AuraSR-v2": "fal-ai/aura-sr",
-	"franciszzj/Leffa": "fal-ai/leffa",
-	"ai-forever/Real-ESRGAN": "fal-ai/esrgan",
-
-	/** image-segmentation */
-	"briaai/RMBG-2.0": "fal-ai/bria/background/remove",
-	"ZhengPeng7/BiRefNet": "fal-ai/birefnet/v2",
-
-	/** text-to-video */
-	"genmo/mochi-1-preview": "fal-ai/mochi-v1",
-	"THUDM/CogVideoX-5b": "fal-ai/cogvideox-5b",
-	"Lightricks/LTX-Video": "fal-ai/ltx-video",
-	"tencent/HunyuanVideo": "fal-ai/hunyuan-video",
-	"wileewang/TransPixar": "fal-ai/transpixar",
-
-	/** image-to-video */
-	"stabilityai/stable-video-1.0": "fal-ai/stable-video",
-	"KwaiVGI/LivePortrait": "fal-ai/live-portrait",
-
-	/** text-to-audio */
-	"hkchengrex/MMAudio": "fal-ai/mmaudio-v2",
-	"stabilityai/stable-audio-open-1.0": "fal-ai/stable-audio",
-
-	/** text-to-speech */
-	"SWivid/F5-TTS": "fal-ai/f5-tts",
-
-	/** image-text-to-text */
-	"vikhyatk/moondream-next": "fal-ai/moondream-next",
-	"microsoft/Florence-2-large": "fal-ai/florence-2-large/caption",
-	"ByteDance/Sa2VA-8B": "fal-ai/sa2va/8b/image/playground",
-
-	/** mask-generation */
-	"facebook/sam2-hiera-large": "fal-ai/sam2",
-
-	/** image-to-3d */
-	"JeffreyXiang/TRELLIS-image-large": "fal-ai/trellis",
-
-	/** depth-estimation */
-	"Intel/dpt-hybrid-midas": "fal-ai/imageutils/depth",
-	"prs-eth/marigold-depth-v1-0": "fal-ai/imageutils/marigold-depth",
-	"depth-anything/Depth-Anything-V2-Large": "fal-ai/image-preprocessors/depth-anything/v2",
-
-	/** automatic-speech-recognition */
-	"openai/whisper-large-v3": "fal-ai/whisper",
+export const FAL_AI_SUPPORTED_MODEL_IDS: ProviderMapping<FalAiId> = {
+	"text-to-image": {
+		"black-forest-labs/FLUX.1-schnell": "fal-ai/flux/schnell",
+		"black-forest-labs/FLUX.1-dev": "fal-ai/flux/dev",
+		"black-forest-labs/FLUX.1-Depth-dev": "fal-ai/flux-lora-depth",
+		"black-forest-labs/FLUX.1-Canny-dev": "fal-ai/flux-lora-canny",
+		"black-forest-labs/FLUX.1-Fill-dev": "fal-ai/flux-lora-fill",
+		"black-forest-labs/FLUX.1-Redux-dev": "fal-ai/flux/dev/redux",
+		"playgroundai/playground-v2.5-1024px-aesthetic": "fal-ai/playground-v25",
+		"ByteDance/SDXL-Lightning": "fal-ai/lightning-models",
+		"PixArt-alpha/PixArt-Sigma-XL-2-1024-MS": "fal-ai/pixart-sigma",
+		"stabilityai/stable-diffusion-3-medium": "fal-ai/stable-diffusion-v3-medium",
+		"Warlord-K/Sana-1024": "fal-ai/sana",
+		"fal/AuraFlow-v0.2": "fal-ai/aura-flow",
+		"stabilityai/stable-diffusion-3.5-large": "fal-ai/stable-diffusion-v35-large",
+		"yresearch/Switti": "fal-ai/switti",
+		"guozinan/PuLID": "fal-ai/flux-pulid",
+		"lllyasviel/ic-light": "fal-ai/iclight-v2",
+		"stabilityai/stable-diffusion-xl-base-1.0": "fal-ai/lora",
+		"Kwai-Kolors/Kolors": "fal-ai/kolors"
+	},
+	"image-to-image": {
+		"Yuanshi/OminiControl": "fal-ai/flux-subject",
+		"fal/AuraSR-v2": "fal-ai/aura-sr",
+		"franciszzj/Leffa": "fal-ai/leffa",
+		"ai-forever/Real-ESRGAN": "fal-ai/esrgan"
+	},
+	"image-segmentation": {
+		"briaai/RMBG-2.0": "fal-ai/bria/background/remove",
+		"ZhengPeng7/BiRefNet": "fal-ai/birefnet/v2"
+	},
+	"text-to-video": {
+		"genmo/mochi-1-preview": "fal-ai/mochi-v1",
+		"THUDM/CogVideoX-5b": "fal-ai/cogvideox-5b",
+		"Lightricks/LTX-Video": "fal-ai/ltx-video",
+		"tencent/HunyuanVideo": "fal-ai/hunyuan-video",
+		"wileewang/TransPixar": "fal-ai/transpixar"
+	},
+	"image-to-video": {
+		"stabilityai/stable-video-1.0": "fal-ai/stable-video",
+		"KwaiVGI/LivePortrait": "fal-ai/live-portrait"
+	},
+	"text-to-audio": {
+		"hkchengrex/MMAudio": "fal-ai/mmaudio-v2",
+		"stabilityai/stable-audio-open-1.0": "fal-ai/stable-audio"
+	},
+	"text-to-speech": {
+		"SWivid/F5-TTS": "fal-ai/f5-tts"
+	},
+	"image-text-to-text": {
+		"vikhyatk/moondream-next": "fal-ai/moondream-next",
+		"microsoft/Florence-2-large": "fal-ai/florence-2-large/caption",
+		"ByteDance/Sa2VA-8B": "fal-ai/sa2va/8b/image/playground"
+	},
+	"mask-generation": {
+		"facebook/sam2-hiera-large": "fal-ai/sam2"
+	},
+	"image-to-3d": {
+		"JeffreyXiang/TRELLIS-image-large": "fal-ai/trellis"
+	},
+	"depth-estimation": {
+		"Intel/dpt-hybrid-midas": "fal-ai/imageutils/depth",
+		"prs-eth/marigold-depth-v1-0": "fal-ai/imageutils/marigold-depth",
+		"depth-anything/Depth-Anything-V2-Large": "fal-ai/image-preprocessors/depth-anything/v2"
+	},
+	"automatic-speech-recognition": {
+		"openai/whisper-large-v3": "fal-ai/whisper"
+	}
 };
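
The `ProviderMapping` type imported from `./types` is not part of this excerpt. Based on how it is used here, it is presumably close to the following sketch (the task key type and the contents of providers/types.ts are assumptions):

```ts
// Assumed shape of ProviderMapping; packages/inference/src/providers/types.ts is not shown in this excerpt.
import type { ModelId } from "../types";

// Task names such as "text-to-image" or "conversational", as used as keys above.
type TaskName = string;

export type ProviderMapping<ProviderId extends string> = Partial<
	Record<TaskName, Partial<Record<ModelId, ProviderId>>>
>;
```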

packages/inference/src/providers/replicate.ts

Lines changed: 10 additions & 16 deletions
@@ -1,22 +1,16 @@
-import type { ModelId } from "../types";
+import type { ProviderMapping } from "./types";

 export const REPLICATE_API_BASE_URL = "https://api.replicate.com";

 type ReplicateId = string;

-/**
- * Mapping from HF model ID -> Replicate model ID
- *
- * Available models can be fetched with:
- * ```
- * curl -s \
- *   -H "Authorization: Bearer $REPLICATE_API_TOKEN" \
- *   'https://api.replicate.com/v1/models'
- * ```
- */
-export const REPLICATE_MODEL_IDS: Partial<Record<ModelId, ReplicateId>> = {
-	/** text-to-image */
-	"black-forest-labs/FLUX.1-schnell": "black-forest-labs/flux-schnell",
-	"ByteDance/SDXL-Lightning":
-		"bytedance/sdxl-lightning-4step:5599ed30703defd1d160a25a63321b4dec97101d98b4674bcc56e41f62f35637",
+export const REPLICATE_SUPPORTED_MODEL_IDS: ProviderMapping<ReplicateId> = {
+	"text-to-image": {
+		"black-forest-labs/FLUX.1-schnell": "black-forest-labs/flux-schnell",
+		"ByteDance/SDXL-Lightning":
+			"bytedance/sdxl-lightning-4step:5599ed30703defd1d160a25a63321b4dec97101d98b4674bcc56e41f62f35637",
+	},
+	// "text-to-speech": {
+	// 	"SWivid/F5-TTS": "x-lance/f5-tts:87faf6dd7a692dd82043f662e76369cab126a2cf1937e25a9d41e0b834fd230e"
+	// },
 };

packages/inference/src/providers/sambanova.ts

Lines changed: 16 additions & 25 deletions
@@ -1,32 +1,23 @@
-import type { ModelId } from "../types";
+import type { ProviderMapping } from "./types";

 export const SAMBANOVA_API_BASE_URL = "https://api.sambanova.ai";

-/**
- * Note for reviewers: our goal would be to ask Sambanova to support
- * our model ids too, so we don't have to define a mapping
- * or keep it up-to-date.
- *
- * As a fallback, if the above is not possible, ask Sambanova to
- * provide the mapping as an fetchable API.
- */
 type SambanovaId = string;

-/**
- * https://community.sambanova.ai/t/supported-models/193
- */
-export const SAMBANOVA_MODEL_IDS: Partial<Record<ModelId, SambanovaId>> = {
+export const SAMBANOVA_SUPPORTED_MODEL_IDS: ProviderMapping<SambanovaId> = {
 	/** Chat completion / conversational */
-	"Qwen/Qwen2.5-Coder-32B-Instruct": "Qwen2.5-Coder-32B-Instruct",
-	"Qwen/Qwen2.5-72B-Instruct": "Qwen2.5-72B-Instruct",
-	"Qwen/QwQ-32B-Preview": "QwQ-32B-Preview",
-	"meta-llama/Llama-3.3-70B-Instruct": "Meta-Llama-3.3-70B-Instruct",
-	"meta-llama/Llama-3.2-1B": "Meta-Llama-3.2-1B-Instruct",
-	"meta-llama/Llama-3.2-3B": "Meta-Llama-3.2-3B-Instruct",
-	"meta-llama/Llama-3.2-11B-Vision-Instruct": "Llama-3.2-11B-Vision-Instruct",
-	"meta-llama/Llama-3.2-90B-Vision-Instruct": "Llama-3.2-90B-Vision-Instruct",
-	"meta-llama/Llama-3.1-8B-Instruct": "Meta-Llama-3.1-8B-Instruct",
-	"meta-llama/Llama-3.1-70B-Instruct": "Meta-Llama-3.1-70B-Instruct",
-	"meta-llama/Llama-3.1-405B-Instruct": "Meta-Llama-3.1-405B-Instruct",
-	"meta-llama/Llama-Guard-3-8B": "Meta-Llama-Guard-3-8B",
+	conversational: {
+		"Qwen/Qwen2.5-Coder-32B-Instruct": "Qwen2.5-Coder-32B-Instruct",
+		"Qwen/Qwen2.5-72B-Instruct": "Qwen2.5-72B-Instruct",
+		"Qwen/QwQ-32B-Preview": "QwQ-32B-Preview",
+		"meta-llama/Llama-3.3-70B-Instruct": "Meta-Llama-3.3-70B-Instruct",
+		"meta-llama/Llama-3.2-1B-Instruct": "Meta-Llama-3.2-1B-Instruct",
+		"meta-llama/Llama-3.2-3B-Instruct": "Meta-Llama-3.2-3B-Instruct",
+		"meta-llama/Llama-3.2-11B-Vision-Instruct": "Llama-3.2-11B-Vision-Instruct",
+		"meta-llama/Llama-3.2-90B-Vision-Instruct": "Llama-3.2-90B-Vision-Instruct",
+		"meta-llama/Llama-3.1-8B-Instruct": "Meta-Llama-3.1-8B-Instruct",
+		"meta-llama/Llama-3.1-70B-Instruct": "Meta-Llama-3.1-70B-Instruct",
+		"meta-llama/Llama-3.1-405B-Instruct": "Meta-Llama-3.1-405B-Instruct",
+		"meta-llama/Llama-Guard-3-8B": "Meta-Llama-Guard-3-8B",
+	},
 };
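
To illustrate the enforcement described in the commit message: because lookups are scoped by task first, a chat-only model cannot be resolved for a text-to-image request. A sketch, assuming the package name `@huggingface/inference`:

```ts
import { SAMBANOVA_SUPPORTED_MODEL_IDS } from "@huggingface/inference"; // assumed package name

const model = "meta-llama/Llama-3.3-70B-Instruct";

// Listed under "conversational", so chat completion resolves normally.
console.log(SAMBANOVA_SUPPORTED_MODEL_IDS["conversational"]?.[model]); // "Meta-Llama-3.3-70B-Instruct"

// Not listed under "text-to-image", so mapModel would throw:
// `Model meta-llama/Llama-3.3-70B-Instruct is not supported for task text-to-image and provider sambanova`
console.log(SAMBANOVA_SUPPORTED_MODEL_IDS["text-to-image"]?.[model]); // undefined
```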
