huggingface · SBrandeis · Feb 11, 2025 · Feb 11, 2025
@@ -125,7 +125,7 @@ for await (const output of hf.textGenerationStream({
 
 ### Text Generation (Chat Completion API Compatible)
 
-Using the `chatCompletion` method, you can generate text with models compatible with the OpenAI Chat Completion API. All models served by [TGI](https://api-inference.huggingface.co/framework/text-generation-inference) on Hugging Face support Messages API.
+Using the `chatCompletion` method, you can generate text with models compatible with the OpenAI Chat Completion API. All models served by [TGI](https://huggingface.co/docs/text-generation-inference/) on Hugging Face support the Messages API.
 
 [Demo](https://huggingface.co/spaces/huggingfacejs/streaming-chat-completion)
 

@@ -1 +1,2 @@
 export const HF_HUB_URL = "https://huggingface.co";
+export const HF_ROUTER_URL = "https://router.huggingface.co";
@@ -1,4 +1,4 @@
-import { HF_HUB_URL } from "../config";
+import { HF_HUB_URL, HF_ROUTER_URL } from "../config";
 import { FAL_AI_API_BASE_URL } from "../providers/fal-ai";
 import { NEBIUS_API_BASE_URL } from "../providers/nebius";
 import { REPLICATE_API_BASE_URL } from "../providers/replicate";
@@ -11,7 +11,7 @@ import { isUrl } from "./isUrl";
 import { version as packageVersion, name as packageName } from "../../package.json";
 import { getProviderModelId } from "./getProviderModelId";
 
-const HF_HUB_INFERENCE_PROXY_TEMPLATE = `${HF_HUB_URL}/api/inference-proxy/{{PROVIDER}}`;
+const HF_HUB_INFERENCE_PROXY_TEMPLATE = `${HF_ROUTER_URL}/{{PROVIDER}}`;
 
 /**
  * Lazy-loaded from huggingface.co/api/tasks when needed

@@ -22,13 +22,14 @@ describe.concurrent("HfInference", () => {
 		"HF Inference",
 		() => {
 			const hf = new HfInference(env.HF_TOKEN);
+
 			it("throws error if model does not exist", () => {
 				expect(
 					hf.fillMask({
-						model: "this-model-does-not-exist-123",
+						model: "this-model/does-not-exist-123",
 						inputs: "[MASK] world!",
 					})
-				).rejects.toThrowError("Not Found: Model not found");
+				).rejects.toThrowError("Model this-model/does-not-exist-123 does not exist");
 			});
 
 			it("fillMask", async () => {
@@ -648,7 +649,7 @@ describe.concurrent("HfInference", () => {
 			});
 
 			it("endpoint - makes request to specified endpoint", async () => {
-				const ep = hf.endpoint("https://api-inference.huggingface.co/models/openai-community/gpt2");
+				const ep = hf.endpoint("https://router.huggingface.co/hf-inference/models/openai-community/gpt2");
 				const { generated_text } = await ep.textGeneration({
 					inputs: "one plus two equals",
 				});
@@ -686,7 +687,7 @@ describe.concurrent("HfInference", () => {
 				expect(out).toContain("2");
 			});
 
-			it("chatCompletionStream modelId Fail - OpenAI Specs", async () => {
+			it.skip("chatCompletionStream modelId Fail - OpenAI Specs", async () => {
 				expect(
 					hf
 						.chatCompletionStream({
@@ -703,7 +704,7 @@ describe.concurrent("HfInference", () => {
 			});
 
 			it("chatCompletion - OpenAI Specs", async () => {
-				const ep = hf.endpoint("https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2");
+				const ep = hf.endpoint("https://router.huggingface.co/hf-inference/models/mistralai/Mistral-7B-Instruct-v0.2");
 				const res = await ep.chatCompletion({
 					model: "tgi",
 					messages: [{ role: "user", content: "Complete the this sentence with words one plus one is equal " }],
@@ -717,7 +718,7 @@ describe.concurrent("HfInference", () => {
 				}
 			});
 			it("chatCompletionStream - OpenAI Specs", async () => {
-				const ep = hf.endpoint("https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2");
+				const ep = hf.endpoint("https://router.huggingface.co/hf-inference/models/mistralai/Mistral-7B-Instruct-v0.2");
 				const stream = ep.chatCompletionStream({
 					model: "tgi",
 					messages: [{ role: "user", content: "Complete the equation 1+1= ,just the answer" }],
Original file line number	Diff line number	Diff line change
		@@ -1 +1,2 @@
		export const HF_HUB_URL = "https://huggingface.co";
		export const HF_ROUTER_URL = "https://router.huggingface.co";