Commit f629886: Add Hyperbolic provider (#2863)

* add hyperbolic provider
* refactor
* update supported providers table
* nit
* add comment
* add tests
* update new provider doc
* handle text-generation payload
* use two classes for text-generation and conversational
* update provider doc

1 parent (cd85541) · commit f629886

15 files changed: +742 −66 lines

docs/source/en/guides/inference.md

Lines changed: 30 additions & 30 deletions

@@ -248,36 +248,36 @@ You might wonder why using [`InferenceClient`] instead of OpenAI's client? There
 
 [`InferenceClient`]'s goal is to provide the easiest interface to run inference on Hugging Face models, on any provider. It has a simple API that supports the most common tasks. Here is a table showing which providers support which tasks:
 

251-
| Domain | Task | HF Inference | Replicate | fal-ai | Fireworks AI | Sambanova | Together |
252-
| ------------------- | --------------------------------------------------- | ------------ | --------- | ------ | ------------ | --------- | -------- |
253-
| **Audio** | [`~InferenceClient.audio_classification`] || | ||||
254-
| | [`~InferenceClient.audio_to_audio`] || | ||||
255-
| | [`~InferenceClient.automatic_speech_recognition`] || | ||||
256-
| | [`~InferenceClient.text_to_speech`] || | ||||
257-
| **Computer Vision** | [`~InferenceClient.image_classification`] || | ||||
258-
| | [`~InferenceClient.image_segmentation`] || | ||||
259-
| | [`~InferenceClient.image_to_image`] || | ||||
260-
| | [`~InferenceClient.image_to_text`] || | ||||
261-
| | [`~InferenceClient.object_detection`] || | ||||
262-
| | [`~InferenceClient.text_to_image`] || || |||
263-
| | [`~InferenceClient.text_to_video`] || | ||||
264-
| | [`~InferenceClient.zero_shot_image_classification`] || | ||||
265-
| **Multimodal** | [`~InferenceClient.document_question_answering`] || | ||||
266-
| | [`~InferenceClient.visual_question_answering`] || | ||||
267-
| **NLP** | [`~InferenceClient.chat_completion`] || | ||||
268-
| | [`~InferenceClient.feature_extraction`] || | ||||
269-
| | [`~InferenceClient.fill_mask`] || | ||||
270-
| | [`~InferenceClient.question_answering`] || | ||||
271-
| | [`~InferenceClient.sentence_similarity`] || | ||||
272-
| | [`~InferenceClient.summarization`] || | ||||
273-
| | [`~InferenceClient.table_question_answering`] || | ||||
274-
| | [`~InferenceClient.text_classification`] || | ||||
275-
| | [`~InferenceClient.text_generation`] || | | |||
276-
| | [`~InferenceClient.token_classification`] || | ||||
277-
| | [`~InferenceClient.translation`] || | ||||
278-
| | [`~InferenceClient.zero_shot_classification`] || | ||||
279-
| **Tabular** | [`~InferenceClient.tabular_classification`] || | ||||
280-
| | [`~InferenceClient.tabular_regression`] || | ||||
251+
| Domain | Task | HF Inference | fal-ai | Fireworks AI | Hyperbolic | Replicate | Sambanova | Together |
252+
| ------------------- | --------------------------------------------------- | ------------ | ------ | ------------ | ---------- | --------- | --------- | -------- |
253+
| **Audio** | [`~InferenceClient.audio_classification`] ||| | | |||
254+
| | [`~InferenceClient.audio_to_audio`] ||| | | |||
255+
| | [`~InferenceClient.automatic_speech_recognition`] || | | | |||
256+
| | [`~InferenceClient.text_to_speech`] || | | | |||
257+
| **Computer Vision** | [`~InferenceClient.image_classification`] ||| | | |||
258+
| | [`~InferenceClient.image_segmentation`] ||| | | |||
259+
| | [`~InferenceClient.image_to_image`] ||| | | |||
260+
| | [`~InferenceClient.image_to_text`] ||| | | |||
261+
| | [`~InferenceClient.object_detection`] ||| | | |||
262+
| | [`~InferenceClient.text_to_image`] |||| | |||
263+
| | [`~InferenceClient.text_to_video`] ||| | | |||
264+
| | [`~InferenceClient.zero_shot_image_classification`] ||| | | |||
265+
| **Multimodal** | [`~InferenceClient.document_question_answering`] ||| | | |||
266+
| | [`~InferenceClient.visual_question_answering`] ||| | | |||
267+
| **NLP** | [`~InferenceClient.chat_completion`] ||| | | |||
268+
| | [`~InferenceClient.feature_extraction`] ||| | | |||
269+
| | [`~InferenceClient.fill_mask`] ||| | | |||
270+
| | [`~InferenceClient.question_answering`] ||| | | |||
271+
| | [`~InferenceClient.sentence_similarity`] ||| | | |||
272+
| | [`~InferenceClient.summarization`] ||| | | |||
273+
| | [`~InferenceClient.table_question_answering`] ||| | | |||
274+
| | [`~InferenceClient.text_classification`] ||| | | |||
275+
| | [`~InferenceClient.text_generation`] ||| | | |||
276+
| | [`~InferenceClient.token_classification`] ||| | | |||
277+
| | [`~InferenceClient.translation`] ||| | | |||
278+
| | [`~InferenceClient.zero_shot_classification`] ||| | | |||
279+
| **Tabular** | [`~InferenceClient.tabular_classification`] ||| | | |||
280+
| | [`~InferenceClient.tabular_regression`] ||| | | |||
 
 <Tip>

src/huggingface_hub/inference/_client.py

Lines changed: 1 addition & 1 deletion

@@ -132,7 +132,7 @@ class InferenceClient:
             path will be appended to the base URL (see the [TGI Messages API](https://huggingface.co/docs/text-generation-inference/en/messages_api)
             documentation for details). When passing a URL as `model`, the client will not append any suffix path to it.
         provider (`str`, *optional*):
-            Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"replicate"`, `"sambanova"`, `"together"`, or `"hf-inference"`.
+            Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"replicate"`, `"sambanova"` or `"together"`.
             defaults to hf-inference (Hugging Face Serverless Inference API).
             If model is a URL or `base_url` is passed, then `provider` is not used.
         token (`str` or `bool`, *optional*):
src/huggingface_hub/inference/_generated/_async_client.py

Lines changed: 1 addition & 1 deletion

@@ -120,7 +120,7 @@ class AsyncInferenceClient:
             path will be appended to the base URL (see the [TGI Messages API](https://huggingface.co/docs/text-generation-inference/en/messages_api)
             documentation for details). When passing a URL as `model`, the client will not append any suffix path to it.
         provider (`str`, *optional*):
-            Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"replicate"`, `"sambanova"`, `"together"`, or `"hf-inference"`.
+            Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"replicate"`, `"sambanova"` or `"together"`.
             defaults to hf-inference (Hugging Face Serverless Inference API).
             If model is a URL or `base_url` is passed, then `provider` is not used.
         token (`str` or `bool`, *optional*):

src/huggingface_hub/inference/_providers/__init__.py

Lines changed: 10 additions & 3 deletions

@@ -9,15 +9,17 @@
 )
 from .fireworks_ai import FireworksAIConversationalTask
 from .hf_inference import HFInferenceBinaryInputTask, HFInferenceConversational, HFInferenceTask
+from .hyperbolic import HyperbolicTextGenerationTask, HyperbolicTextToImageTask
 from .replicate import ReplicateTask, ReplicateTextToSpeechTask
 from .sambanova import SambanovaConversationalTask
-from .together import TogetherTextGenerationTask, TogetherTextToImageTask
+from .together import TogetherConversationalTask, TogetherTextGenerationTask, TogetherTextToImageTask
 
 
 PROVIDER_T = Literal[
     "fal-ai",
     "fireworks-ai",
     "hf-inference",
+    "hyperbolic",
     "replicate",
     "sambanova",
     "together",
@@ -61,6 +63,11 @@
         "summarization": HFInferenceTask("summarization"),
         "visual-question-answering": HFInferenceBinaryInputTask("visual-question-answering"),
     },
+    "hyperbolic": {
+        "text-to-image": HyperbolicTextToImageTask(),
+        "conversational": HyperbolicTextGenerationTask("conversational"),
+        "text-generation": HyperbolicTextGenerationTask("text-generation"),
+    },
     "replicate": {
         "text-to-image": ReplicateTask("text-to-image"),
         "text-to-speech": ReplicateTextToSpeechTask(),
@@ -71,8 +78,8 @@
     },
     "together": {
         "text-to-image": TogetherTextToImageTask(),
-        "conversational": TogetherTextGenerationTask("conversational"),
-        "text-generation": TogetherTextGenerationTask("text-generation"),
+        "conversational": TogetherConversationalTask(),
+        "text-generation": TogetherTextGenerationTask(),
     },
 }
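The `PROVIDERS` registry above is a two-level mapping: provider name, then task name, then a task-helper instance. A minimal standalone sketch of that lookup pattern (stand-in strings replace the real helper objects here, and `get_provider_helper` is a simplified stand-in for the library's actual resolution logic, not a copy of it):

```python
from typing import Dict

# Stand-in registry mirroring the shape of PROVIDERS in __init__.py;
# the real entries are task-helper instances, strings stand in for them here.
PROVIDERS: Dict[str, Dict[str, str]] = {
    "hyperbolic": {
        "text-to-image": "HyperbolicTextToImageTask()",
        "conversational": "HyperbolicTextGenerationTask('conversational')",
        "text-generation": "HyperbolicTextGenerationTask('text-generation')",
    },
    "together": {
        "conversational": "TogetherConversationalTask()",
        "text-generation": "TogetherTextGenerationTask()",
    },
}


def get_provider_helper(provider: str, task: str) -> str:
    """Look up the helper for a provider/task pair, with explicit errors."""
    if provider not in PROVIDERS:
        raise ValueError(f"Provider '{provider}' not supported. Available: {sorted(PROVIDERS)}")
    helpers = PROVIDERS[provider]
    if task not in helpers:
        raise ValueError(f"Task '{task}' not supported for provider '{provider}'. Available: {sorted(helpers)}")
    return helpers[task]
```

This two-level shape is why adding a provider is additive: a new top-level key with its task dict, plus the new literal in `PROVIDER_T`, and no existing entry changes.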
src/huggingface_hub/inference/_providers/_common.py

Lines changed: 33 additions & 0 deletions

@@ -20,6 +20,7 @@
     "fal-ai": {},
     "fireworks-ai": {},
     "hf-inference": {},
+    "hyperbolic": {},
     "replicate": {},
     "sambanova": {},
     "together": {},
@@ -179,6 +180,38 @@ def _prepare_payload_as_bytes(
         return None
 
 
+class BaseConversationalTask(TaskProviderHelper):
+    """
+    Base class for conversational (chat completion) tasks.
+    The schema follows the OpenAI API format defined here: https://platform.openai.com/docs/api-reference/chat
+    """
+
+    def __init__(self, provider: str, base_url: str):
+        super().__init__(provider=provider, base_url=base_url, task="conversational")
+
+    def _prepare_route(self, mapped_model: str) -> str:
+        return "/v1/chat/completions"
+
+    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
+        return {"messages": inputs, **filter_none(parameters), "model": mapped_model}
+
+
+class BaseTextGenerationTask(TaskProviderHelper):
+    """
+    Base class for text-generation (completion) tasks.
+    The schema follows the OpenAI API format defined here: https://platform.openai.com/docs/api-reference/completions
+    """
+
+    def __init__(self, provider: str, base_url: str):
+        super().__init__(provider=provider, base_url=base_url, task="text-generation")
+
+    def _prepare_route(self, mapped_model: str) -> str:
+        return "/v1/completions"
+
+    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
+        return {"prompt": inputs, **filter_none(parameters), "model": mapped_model}
+
+
 @lru_cache(maxsize=None)
 def _fetch_inference_provider_mapping(model: str) -> Dict:
     """
src/huggingface_hub/inference/_providers/fireworks_ai.py

Lines changed: 3 additions & 11 deletions

@@ -1,14 +1,6 @@
-from typing import Any, Dict, Optional
+from ._common import BaseConversationalTask
 
-from ._common import TaskProviderHelper, filter_none
 
-
-class FireworksAIConversationalTask(TaskProviderHelper):
+class FireworksAIConversationalTask(BaseConversationalTask):
     def __init__(self):
-        super().__init__(provider="fireworks-ai", base_url="https://api.fireworks.ai/inference", task="conversational")
-
-    def _prepare_route(self, mapped_model: str) -> str:
-        return "/v1/chat/completions"
-
-    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
-        return {"messages": inputs, **filter_none(parameters), "model": mapped_model}
+        super().__init__(provider="fireworks-ai", base_url="https://api.fireworks.ai/inference")
src/huggingface_hub/inference/_providers/hyperbolic.py

Lines changed: 43 additions & 0 deletions

@@ -0,0 +1,43 @@
+import base64
+from typing import Any, Dict, Optional, Union
+
+from huggingface_hub.inference._common import _as_dict
+from huggingface_hub.inference._providers._common import BaseConversationalTask, TaskProviderHelper, filter_none
+
+
+class HyperbolicTextToImageTask(TaskProviderHelper):
+    def __init__(self):
+        super().__init__(provider="hyperbolic", base_url="https://api.hyperbolic.xyz", task="text-to-image")
+
+    def _prepare_route(self, mapped_model: str) -> str:
+        return "/v1/images/generations"
+
+    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
+        parameters = filter_none(parameters)
+        if "num_inference_steps" in parameters:
+            parameters["steps"] = parameters.pop("num_inference_steps")
+        if "guidance_scale" in parameters:
+            parameters["cfg_scale"] = parameters.pop("guidance_scale")
+        # For Hyperbolic, the width and height are required parameters
+        if "width" not in parameters:
+            parameters["width"] = 512
+        if "height" not in parameters:
+            parameters["height"] = 512
+        return {"prompt": inputs, "model_name": mapped_model, **parameters}
+
+    def get_response(self, response: Union[bytes, Dict]) -> Any:
+        response_dict = _as_dict(response)
+        return base64.b64decode(response_dict["images"][0]["image"])
+
+
+class HyperbolicTextGenerationTask(BaseConversationalTask):
+    """
+    Special case for Hyperbolic, where text-generation task is handled as a conversational task.
+    """
+
+    def __init__(self, task: str):
+        super().__init__(
+            provider="hyperbolic",
+            base_url="https://api.hyperbolic.xyz",
+        )
+        self.task = task
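`HyperbolicTextToImageTask._prepare_payload_as_dict` renames diffusers-style parameter names to the field names Hyperbolic's image endpoint expects, and fills in the required `width`/`height`. That mapping step, extracted into a standalone sketch (the key names and 512 defaults come from the diff above):

```python
from typing import Any, Dict


def map_text_to_image_params(parameters: Dict[str, Any]) -> Dict[str, Any]:
    # Drop unset values, mirroring filter_none() in _common.py.
    params = {k: v for k, v in parameters.items() if v is not None}
    # Rename diffusers-style keys to Hyperbolic's field names.
    if "num_inference_steps" in params:
        params["steps"] = params.pop("num_inference_steps")
    if "guidance_scale" in params:
        params["cfg_scale"] = params.pop("guidance_scale")
    # width and height are required by the Hyperbolic API; default to 512.
    params.setdefault("width", 512)
    params.setdefault("height", 512)
    return params
```

The full payload then nests these alongside `prompt` and `model_name`; note the provider takes `model_name` rather than the `model` key used by the chat endpoints.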

src/huggingface_hub/inference/_providers/new_provider.md

Lines changed: 2 additions & 0 deletions

@@ -10,6 +10,8 @@ Implement the methods that require custom handling. Check out the base implement
 
 If the provider supports multiple tasks that require different implementations, create dedicated subclasses for each task, following the pattern shown in `fal_ai.py`.
 
+For `text-generation` and `conversational` tasks, one can just inherit from `BaseTextGenerationTask` and `BaseConversationalTask` respectively (defined in `_common.py`) and override the methods if needed. Examples can be found in `fireworks_ai.py` and `together.py`.
+
 ```py
 from typing import Any, Dict, Optional, Union
 
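Following that guidance, a conversational provider reduces to a single constructor call. A self-contained sketch of the pattern (the base class here is a minimal local stand-in for `BaseConversationalTask` from `_common.py`, and `ExampleAIConversationalTask` with its base URL is hypothetical, not a real provider):

```python
from typing import Any, Dict, List, Optional


class BaseConversationalTask:
    """Minimal stand-in for huggingface_hub's BaseConversationalTask (see _common.py)."""

    def __init__(self, provider: str, base_url: str):
        self.provider = provider
        self.base_url = base_url
        self.task = "conversational"

    def _prepare_route(self, mapped_model: str) -> str:
        return "/v1/chat/completions"

    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
        params = {k: v for k, v in parameters.items() if v is not None}
        return {"messages": inputs, **params, "model": mapped_model}


class ExampleAIConversationalTask(BaseConversationalTask):
    """Hypothetical new provider: everything is inherited from the base class."""

    def __init__(self):
        super().__init__(provider="example-ai", base_url="https://api.example-ai.invalid")
```

A provider whose API deviates from the OpenAI schema would override `_prepare_route` or `_prepare_payload_as_dict`, as `hyperbolic.py` does for text-to-image.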
src/huggingface_hub/inference/_providers/sambanova.py

Lines changed: 3 additions & 11 deletions

@@ -1,14 +1,6 @@
-from typing import Any, Dict, Optional
+from huggingface_hub.inference._providers._common import BaseConversationalTask
 
-from huggingface_hub.inference._providers._common import TaskProviderHelper, filter_none
 
-
-class SambanovaConversationalTask(TaskProviderHelper):
+class SambanovaConversationalTask(BaseConversationalTask):
     def __init__(self):
-        super().__init__(provider="sambanova", base_url="https://api.sambanova.ai", task="conversational")
-
-    def _prepare_route(self, mapped_model: str) -> str:
-        return "/v1/chat/completions"
-
-    def _prepare_payload_as_dict(self, inputs: Any, parameters: Dict, mapped_model: str) -> Optional[Dict]:
-        return {"messages": inputs, **filter_none(parameters), "model": mapped_model}
+        super().__init__(provider="sambanova", base_url="https://api.sambanova.ai")
