
Commit a86a44a

Add HF-Inference page
1 parent bf087a8 commit a86a44a

5 files changed (+221 lines, -14 lines)


docs/inference-providers/_toctree.yml

Lines changed: 2 additions & 0 deletions
@@ -21,6 +21,8 @@
     title: Fireworks
   - local: providers/hyperbolic
     title: Hyperbolic
+  - local: providers/hf-inference
+    title: HF Inference
   - local: providers/nebius
     title: Nebius
   - local: providers/novita

docs/inference-providers/index.md

Lines changed: 12 additions & 11 deletions
@@ -13,17 +13,18 @@ To learn more about the launch of Inference Providers, check out our [announceme
 
 Here is the complete list of partners integrated with Inference Providers, and the supported tasks for each of them:
 
-| Provider                               | Chat completion (LLM) | Chat completion (VLM) | Feature Extraction | Text to Image | Text to video |
-| -------------------------------------- | :-------------------: | :-------------------: | :----------------: | :-----------: | :-----------: |
-| [Cerebras](./providers/cerebras)       | ✅ |    |    |    |    |
-| [Fal AI](./providers/fal-ai)           |    |    |    | ✅ | ✅ |
-| [Fireworks](./providers/fireworks-ai)  | ✅ | ✅ |    |    |    |
-| [Hyperbolic](./providers/hyperbolic)   | ✅ | ✅ |    |    |    |
-| [Nebius](./providers/nebius)           | ✅ | ✅ |    | ✅ |    |
-| [Novita](./providers/novita)           | ✅ | ✅ |    |    | ✅ |
-| [Replicate](./providers/replicate)     |    |    |    | ✅ | ✅ |
-| [SambaNova](./providers/sambanova)     | ✅ |    | ✅ |    |    |
-| [Together](./providers/together)       | ✅ | ✅ |    | ✅ |    |
+| Provider                                  | Chat completion (LLM) | Chat completion (VLM) | Feature Extraction | Text to Image | Text to video |
+| ----------------------------------------- | :-------------------: | :-------------------: | :----------------: | :-----------: | :-----------: |
+| [Cerebras](./providers/cerebras)          | ✅ |    |    |    |    |
+| [Fal AI](./providers/fal-ai)              |    |    |    | ✅ | ✅ |
+| [Fireworks](./providers/fireworks-ai)     | ✅ | ✅ |    |    |    |
+| [HF Inference](./providers/hf-inference)  | ✅ | ✅ | ✅ | ✅ |    |
+| [Hyperbolic](./providers/hyperbolic)      | ✅ | ✅ |    |    |    |
+| [Nebius](./providers/nebius)              | ✅ | ✅ |    | ✅ |    |
+| [Novita](./providers/novita)              | ✅ | ✅ |    |    | ✅ |
+| [Replicate](./providers/replicate)        |    |    |    | ✅ | ✅ |
+| [SambaNova](./providers/sambanova)        | ✅ |    | ✅ |    |    |
+| [Together](./providers/together)          | ✅ | ✅ |    | ✅ |    |
 
 ## Why use Inference Providers?
 

docs/inference-providers/providers/hf-inference.md

Lines changed: 199 additions & 0 deletions

@@ -0,0 +1,199 @@
<!---
WARNING

This markdown file has been generated from a script. Please do not edit it directly.

If you want to update the content related to hf-inference's description, please edit the template file under `https://github.com/huggingface/hub-docs/tree/main/scripts/inference-providers/templates/providers/hf-inference.handlebars`.

For more details, check out the `generate.ts` script: https://github.com/huggingface/hub-docs/blob/main/scripts/inference-providers/scripts/generate.ts.
--->

# HF Inference

![https://huggingface.co/](https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo-with-title.png)

HF Inference is the serverless Inference API powered by Hugging Face. Prior to the launch of Inference Providers, this service was known as "Inference API (serverless)".
If you are interested in deploying models to dedicated, autoscaling infrastructure managed by Hugging Face, check out [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) instead.
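
For orientation, and not part of the generated page itself, a request routed through HF Inference with the `huggingface_hub` Python client might look like the sketch below; the model ID comes from the mappings on this page, while the token placeholder and prompt are illustrative assumptions.

```python
from huggingface_hub import InferenceClient

# Route the request to the "hf-inference" provider; replace the token with your own.
client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

completion = client.chat_completion(
    model="Qwen/QwQ-32B",
    messages=[{"role": "user", "content": "What is the capital of France?"}],
    max_tokens=512,
)
print(completion.choices[0].message.content)
```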

## Supported tasks


### Audio Classification

Find out more about Audio Classification [here](../tasks/audio_classification).

<InferenceSnippet
    pipeline=audio-classification
    providersMapping={ {"hf-inference":{"modelId":"ehcalabres/wav2vec2-lg-xlsr-en-speech-emotion-recognition","providerModelId":"ehcalabres/wav2vec2-lg-xlsr-en-speech-emotion-recognition"} } }
/>
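
As a rough sketch (not part of the generated snippet above), the same mapping could be exercised with `huggingface_hub`'s `audio_classification` method; the audio file path is a placeholder.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# Returns a list of label/score predictions for the audio clip.
predictions = client.audio_classification(
    "speech_sample.wav",  # placeholder path to a local audio file
    model="ehcalabres/wav2vec2-lg-xlsr-en-speech-emotion-recognition",
)
for pred in predictions:
    print(pred.label, round(pred.score, 3))
```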

### Automatic Speech Recognition

Find out more about Automatic Speech Recognition [here](../tasks/automatic_speech_recognition).

<InferenceSnippet
    pipeline=automatic-speech-recognition
    providersMapping={ {"hf-inference":{"modelId":"openai/whisper-large-v3-turbo","providerModelId":"openai/whisper-large-v3-turbo"} } }
/>
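
A minimal sketch of a transcription call with `huggingface_hub` (illustrative, not from this commit; the file path is a placeholder):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# Transcribe a local audio file with Whisper.
result = client.automatic_speech_recognition(
    "interview.flac",  # placeholder path
    model="openai/whisper-large-v3-turbo",
)
print(result.text)
```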

### Chat Completion (LLM)

Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).

<InferenceSnippet
    pipeline=text-generation
    providersMapping={ {"hf-inference":{"modelId":"Qwen/QwQ-32B","providerModelId":"Qwen/QwQ-32B"} } }
conversational />


### Chat Completion (VLM)

Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).

<InferenceSnippet
    pipeline=image-text-to-text
    providersMapping={ {"hf-inference":{"modelId":"google/gemma-3-27b-it","providerModelId":"google/gemma-3-27b-it"} } }
conversational />
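
For a vision-language request, a hedged sketch with `huggingface_hub` might pass an image URL alongside the text prompt; the URL below is a placeholder, not from this commit.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# OpenAI-style message with both text and an image URL (placeholder).
messages = [
    {
        "role": "user",
        "content": [
            {"type": "text", "text": "Describe this image in one sentence."},
            {"type": "image_url", "image_url": {"url": "https://example.com/cat.png"}},
        ],
    }
]
completion = client.chat_completion(model="google/gemma-3-27b-it", messages=messages)
print(completion.choices[0].message.content)
```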

### Feature Extraction

Find out more about Feature Extraction [here](../tasks/feature_extraction).

<InferenceSnippet
    pipeline=feature-extraction
    providersMapping={ {"hf-inference":{"modelId":"intfloat/multilingual-e5-large-instruct","providerModelId":"intfloat/multilingual-e5-large-instruct"} } }
/>
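
An illustrative embedding call with `huggingface_hub` (assumes numpy is available, since the client returns the result as an array):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# Embed a sentence; the result is a numpy array of floats.
embeddings = client.feature_extraction(
    "Inference Providers route requests to serverless endpoints.",
    model="intfloat/multilingual-e5-large-instruct",
)
print(embeddings.shape)
```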

### Fill Mask

Find out more about Fill Mask [here](../tasks/fill_mask).

<InferenceSnippet
    pipeline=fill-mask
    providersMapping={ {"hf-inference":{"modelId":"google-bert/bert-base-uncased","providerModelId":"google-bert/bert-base-uncased"} } }
/>
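
A small sketch of a fill-mask call (illustrative; BERT's `[MASK]` token is assumed here, other models may use a different mask token):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

candidates = client.fill_mask(
    "The goal of life is [MASK].",
    model="google-bert/bert-base-uncased",
)
for c in candidates:
    print(c.token_str, round(c.score, 3))
```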

### Image Classification

Find out more about Image Classification [here](../tasks/image_classification).

<InferenceSnippet
    pipeline=image-classification
    providersMapping={ {"hf-inference":{"modelId":"Falconsai/nsfw_image_detection","providerModelId":"Falconsai/nsfw_image_detection"} } }
/>


### Image To Image

Find out more about Image To Image [here](../tasks/image_to_image).

<InferenceSnippet
    pipeline=image-to-image
    providersMapping={ {"hf-inference":{"modelId":"enhanceaiteam/Flux-Uncensored-V2","providerModelId":"black-forest-labs/FLUX.1-dev"} } }
/>


### Object Detection

Find out more about Object Detection [here](../tasks/object_detection).

<InferenceSnippet
    pipeline=object-detection
    providersMapping={ {"hf-inference":{"modelId":"facebook/detr-resnet-50","providerModelId":"facebook/detr-resnet-50"} } }
/>

### Question Answering

Find out more about Question Answering [here](../tasks/question_answering).

<InferenceSnippet
    pipeline=question-answering
    providersMapping={ {"hf-inference":{"modelId":"deepset/gelectra-large-germanquad","providerModelId":"deepset/gelectra-large-germanquad"} } }
/>
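
A hedged sketch of an extractive QA call with `huggingface_hub`; the question and context are made-up German examples, since the mapped model is a German QA model.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

answer = client.question_answering(
    question="Wo wohnt Angela?",
    context="Angela wohnt seit 2010 in Berlin.",
    model="deepset/gelectra-large-germanquad",
)
print(answer.answer, round(answer.score, 3))
```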

### Summarization

Find out more about Summarization [here](../tasks/summarization).

<InferenceSnippet
    pipeline=summarization
    providersMapping={ {"hf-inference":{"modelId":"facebook/bart-large-cnn","providerModelId":"facebook/bart-large-cnn"} } }
/>
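
An illustrative summarization call (the input text is a placeholder, not from this commit):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

article = (
    "Hugging Face hosts hundreds of thousands of models. "
    "Inference Providers let you query many of them through a single API "
    "without managing any infrastructure yourself."
)
summary = client.summarization(article, model="facebook/bart-large-cnn")
print(summary.summary_text)
```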

### Text Classification

Find out more about Text Classification [here](../tasks/text_classification).

<InferenceSnippet
    pipeline=text-classification
    providersMapping={ {"hf-inference":{"modelId":"ProsusAI/finbert","providerModelId":"ProsusAI/finbert"} } }
/>
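
A short sketch of a classification call with `huggingface_hub`; the example sentence is an assumption chosen to suit FinBERT's financial-sentiment labels.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

results = client.text_classification(
    "Quarterly revenue grew 12% year over year.",
    model="ProsusAI/finbert",
)
for r in results:
    print(r.label, round(r.score, 3))
```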

### Text Generation

Find out more about Text Generation [here](../tasks/text_generation).

<InferenceSnippet
    pipeline=text-generation
    providersMapping={ {"hf-inference":{"modelId":"Qwen/QwQ-32B","providerModelId":"Qwen/QwQ-32B"} } }
/>


### Text To Image

Find out more about Text To Image [here](../tasks/text_to_image).

<InferenceSnippet
    pipeline=text-to-image
    providersMapping={ {"hf-inference":{"modelId":"black-forest-labs/FLUX.1-dev","providerModelId":"black-forest-labs/FLUX.1-dev"} } }
/>
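
An illustrative image-generation call with `huggingface_hub` (the prompt and output filename are placeholders):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# Returns a PIL.Image object that can be saved or displayed.
image = client.text_to_image(
    "An astronaut riding a horse on the moon, watercolor style",
    model="black-forest-labs/FLUX.1-dev",
)
image.save("astronaut.png")
```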

### Text To Video

Find out more about Text To Video [here](../tasks/text_to_video).

<InferenceSnippet
    pipeline=text-to-video
    providersMapping={ {"hf-inference":{"modelId":"AdamLucek/Wan2.1-T2V-14B-OldBookIllustrations","providerModelId":"black-forest-labs/FLUX.1-dev"} } }
/>


### Token Classification

Find out more about Token Classification [here](../tasks/token_classification).

<InferenceSnippet
    pipeline=token-classification
    providersMapping={ {"hf-inference":{"modelId":"dbmdz/bert-large-cased-finetuned-conll03-english","providerModelId":"dbmdz/bert-large-cased-finetuned-conll03-english"} } }
/>

### Translation

Find out more about Translation [here](../tasks/translation).

<InferenceSnippet
    pipeline=translation
    providersMapping={ {"hf-inference":{"modelId":"facebook/nllb-200-distilled-600M","providerModelId":"facebook/nllb-200-distilled-600M"} } }
/>
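
A tentative sketch of a translation call with `huggingface_hub`; the `src_lang`/`tgt_lang` arguments and FLORES-style language codes are assumptions based on how NLLB models are typically queried, not something specified by this commit.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# NLLB models expect explicit source and target language codes.
result = client.translation(
    "Hugging Face makes machine learning more accessible.",
    model="facebook/nllb-200-distilled-600M",
    src_lang="eng_Latn",
    tgt_lang="fra_Latn",
)
print(result.translation_text)
```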

### Zero Shot Classification

Find out more about Zero Shot Classification [here](../tasks/zero_shot_classification).

<InferenceSnippet
    pipeline=zero-shot-classification
    providersMapping={ {"hf-inference":{"modelId":"facebook/bart-large-mnli","providerModelId":"facebook/bart-large-mnli"} } }
/>
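
A hedged sketch of a zero-shot call with `huggingface_hub`; the input sentence and candidate labels are made-up examples.

```python
from huggingface_hub import InferenceClient

client = InferenceClient(provider="hf-inference", api_key="hf_xxx")

# Classify the text against arbitrary candidate labels.
results = client.zero_shot_classification(
    "The new GPU delivers twice the throughput at the same power budget.",
    ["technology", "sports", "politics"],
    model="facebook/bart-large-mnli",
)
for r in results:
    print(r.label, round(r.score, 3))
```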

scripts/inference-providers/scripts/generate.ts

Lines changed: 0 additions & 3 deletions
@@ -736,9 +736,6 @@ await Promise.all(
 
 await Promise.all(
   Object.entries(PER_PROVIDER_TASKS).map(async ([provider, tasks]) => {
-    if (provider === "hf-inference") {
-      return;
-    }
     const rendered = await renderTemplate(provider, "providers", {
       tasksSection: PROVIDER_TASKS_TEMPLATE({ tasks }),
     });
scripts/inference-providers/templates/providers/hf-inference.handlebars

Lines changed: 8 additions & 0 deletions

@@ -0,0 +1,8 @@
# HF Inference

![https://huggingface.co/](https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo-with-title.png)

HF Inference is the serverless Inference API powered by Hugging Face. Prior to the launch of Inference Providers, this service was known as "Inference API (serverless)".
If you are interested in deploying models to dedicated, autoscaling infrastructure managed by Hugging Face, check out [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) instead.

{{{tasksSection}}}
