
Commit 604b9ca

Add Novita provider (#2865)
* add novita
* refactor tests
* quality
* regenerate cassettes
1 parent fb4f42e commit 604b9ca

11 files changed (+450 -68 lines)

docs/source/en/guides/inference.md

Lines changed: 30 additions & 30 deletions
@@ -248,36 +248,36 @@ You might wonder why using [`InferenceClient`] instead of OpenAI's client? There
 
 [`InferenceClient`]'s goal is to provide the easiest interface to run inference on Hugging Face models, on any provider. It has a simple API that supports the most common tasks. Here is a table showing which providers support which tasks:
 
-| Domain | Task | HF Inference | fal-ai | Fireworks AI | Hyperbolic | Replicate | Sambanova | Together |
-| ------------------- | --------------------------------------------------- | ------------ | ------ | ------------ | ---------- | --------- | --------- | -------- |
-| **Audio** | [`~InferenceClient.audio_classification`] ||||||||
-| | [`~InferenceClient.audio_to_audio`] ||||||||
-| | [`~InferenceClient.automatic_speech_recognition`] ||||||||
-| | [`~InferenceClient.text_to_speech`] ||||||||
-| **Computer Vision** | [`~InferenceClient.image_classification`] ||||||||
-| | [`~InferenceClient.image_segmentation`] ||||||||
-| | [`~InferenceClient.image_to_image`] ||||||||
-| | [`~InferenceClient.image_to_text`] ||||||||
-| | [`~InferenceClient.object_detection`] ||||||||
-| | [`~InferenceClient.text_to_image`] ||||||||
-| | [`~InferenceClient.text_to_video`] ||||||||
-| | [`~InferenceClient.zero_shot_image_classification`] ||||||||
-| **Multimodal** | [`~InferenceClient.document_question_answering`] ||||||||
-| | [`~InferenceClient.visual_question_answering`] ||||||||
-| **NLP** | [`~InferenceClient.chat_completion`] ||||||||
-| | [`~InferenceClient.feature_extraction`] ||||||||
-| | [`~InferenceClient.fill_mask`] ||||||||
-| | [`~InferenceClient.question_answering`] ||||||||
-| | [`~InferenceClient.sentence_similarity`] ||||||||
-| | [`~InferenceClient.summarization`] ||||||||
-| | [`~InferenceClient.table_question_answering`] ||||||||
-| | [`~InferenceClient.text_classification`] ||||||||
-| | [`~InferenceClient.text_generation`] ||||||||
-| | [`~InferenceClient.token_classification`] ||||||||
-| | [`~InferenceClient.translation`] ||||||||
-| | [`~InferenceClient.zero_shot_classification`] ||||||||
-| **Tabular** | [`~InferenceClient.tabular_classification`] ||||||||
-| | [`~InferenceClient.tabular_regression`] ||||||||
+| Domain | Task | HF Inference | fal-ai | Fireworks AI | Hyperbolic | Novita AI | Replicate | Sambanova | Together |
+| ------------------- | --------------------------------------------------- | ------------ | ------ | ------------ | ---------- | ------ | --------- | --------- | -------- |
+| **Audio** | [`~InferenceClient.audio_classification`] |||||| |||
+| | [`~InferenceClient.audio_to_audio`] |||||| |||
+| | [`~InferenceClient.automatic_speech_recognition`] |||||| |||
+| | [`~InferenceClient.text_to_speech`] ||||| | |||
+| **Computer Vision** | [`~InferenceClient.image_classification`] |||||| |||
+| | [`~InferenceClient.image_segmentation`] |||||| |||
+| | [`~InferenceClient.image_to_image`] |||||| |||
+| | [`~InferenceClient.image_to_text`] |||||| |||
+| | [`~InferenceClient.object_detection`] |||||| |||
+| | [`~InferenceClient.text_to_image`] ||||| | |||
+| | [`~InferenceClient.text_to_video`] ||||| | |||
+| | [`~InferenceClient.zero_shot_image_classification`] |||||| |||
+| **Multimodal** | [`~InferenceClient.document_question_answering`] |||||| |||
+| | [`~InferenceClient.visual_question_answering`] |||||| |||
+| **NLP** | [`~InferenceClient.chat_completion`] ||||| | |||
+| | [`~InferenceClient.feature_extraction`] |||||| |||
+| | [`~InferenceClient.fill_mask`] |||||| |||
+| | [`~InferenceClient.question_answering`] |||||| |||
+| | [`~InferenceClient.sentence_similarity`] |||||| |||
+| | [`~InferenceClient.summarization`] |||||| |||
+| | [`~InferenceClient.table_question_answering`] |||||| |||
+| | [`~InferenceClient.text_classification`] |||||| |||
+| | [`~InferenceClient.text_generation`] ||||| | |||
+| | [`~InferenceClient.token_classification`] |||||| |||
+| | [`~InferenceClient.translation`] |||||| |||
+| | [`~InferenceClient.zero_shot_classification`] |||||| |||
+| **Tabular** | [`~InferenceClient.tabular_classification`] |||||| |||
+| | [`~InferenceClient.tabular_regression`] |||||| |||
 
 <Tip>

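As context for the new column, a minimal sketch of what routing through Novita looks like with [`InferenceClient`]. The model ID and token below are placeholders, and the model's availability on Novita is assumed for illustration rather than taken from this commit.

from huggingface_hub import InferenceClient

client = InferenceClient(
    provider="novita",  # provider value added by this commit
    api_key="hf_***",   # placeholder Hugging Face token
)

# `chat_completion` is one of the two tasks registered for Novita (see _providers/__init__.py below).
response = client.chat_completion(
    model="meta-llama/Llama-3.1-8B-Instruct",  # example model ID, assumed to be served by Novita
    messages=[{"role": "user", "content": "What is the capital of France?"}],
    max_tokens=64,
)
print(response.choices[0].message.content)
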
src/huggingface_hub/inference/_client.py

Lines changed: 1 addition & 1 deletion
@@ -132,7 +132,7 @@ class InferenceClient:
     path will be appended to the base URL (see the [TGI Messages API](https://huggingface.co/docs/text-generation-inference/en/messages_api)
     documentation for details). When passing a URL as `model`, the client will not append any suffix path to it.
 provider (`str`, *optional*):
-    Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"replicate"`, `"sambanova"` or `"together"`.
+    Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"novita"`, `"replicate"`, `"sambanova"` or `"together"`.
     Defaults to hf-inference (Hugging Face Serverless Inference API).
     If model is a URL or `base_url` is passed, then `provider` is not used.
 token (`str` or `bool`, *optional*):

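A short sketch of the `provider` / `model` interplay this docstring describes; the endpoint URL is a made-up placeholder.

from huggingface_hub import InferenceClient

# No provider given -> defaults to "hf-inference" (Hugging Face Serverless Inference API).
default_client = InferenceClient()

# Provider name accepted after this commit.
novita_client = InferenceClient(provider="novita")

# `model` given as a URL -> the client calls that endpoint directly and `provider` is not used.
endpoint_client = InferenceClient(model="https://my-endpoint.example.com")  # placeholder URL
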
src/huggingface_hub/inference/_generated/_async_client.py

Lines changed: 1 addition & 1 deletion
@@ -120,7 +120,7 @@ class AsyncInferenceClient:
     path will be appended to the base URL (see the [TGI Messages API](https://huggingface.co/docs/text-generation-inference/en/messages_api)
     documentation for details). When passing a URL as `model`, the client will not append any suffix path to it.
 provider (`str`, *optional*):
-    Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"replicate"`, `"sambanova"` or `"together"`.
+    Name of the provider to use for inference. Can be `"fal-ai"`, `"fireworks-ai"`, `"hf-inference"`, `"hyperbolic"`, `"novita"`, `"replicate"`, `"sambanova"` or `"together"`.
     Defaults to hf-inference (Hugging Face Serverless Inference API).
     If model is a URL or `base_url` is passed, then `provider` is not used.
 token (`str` or `bool`, *optional*):

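The async client takes the same `provider` argument; a minimal sketch exercising the other Novita task, text generation. The model ID and token are placeholders, and availability on Novita is assumed.

import asyncio

from huggingface_hub import AsyncInferenceClient


async def main() -> None:
    client = AsyncInferenceClient(provider="novita", api_key="hf_***")  # placeholder token
    output = await client.text_generation(
        "The huggingface_hub library is ",
        model="meta-llama/Llama-3.1-8B-Instruct",  # example model ID
        max_new_tokens=20,
    )
    print(output)


asyncio.run(main())
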
src/huggingface_hub/inference/_providers/__init__.py

Lines changed: 6 additions & 0 deletions
@@ -10,6 +10,7 @@
 from .fireworks_ai import FireworksAIConversationalTask
 from .hf_inference import HFInferenceBinaryInputTask, HFInferenceConversational, HFInferenceTask
 from .hyperbolic import HyperbolicTextGenerationTask, HyperbolicTextToImageTask
+from .novita import NovitaConversationalTask, NovitaTextGenerationTask
 from .replicate import ReplicateTask, ReplicateTextToSpeechTask
 from .sambanova import SambanovaConversationalTask
 from .together import TogetherConversationalTask, TogetherTextGenerationTask, TogetherTextToImageTask

@@ -20,6 +21,7 @@
     "fireworks-ai",
     "hf-inference",
     "hyperbolic",
+    "novita",
     "replicate",
     "sambanova",
     "together",

@@ -68,6 +70,10 @@
         "conversational": HyperbolicTextGenerationTask("conversational"),
         "text-generation": HyperbolicTextGenerationTask("text-generation"),
     },
+    "novita": {
+        "text-generation": NovitaTextGenerationTask(),
+        "conversational": NovitaConversationalTask(),
+    },
     "replicate": {
         "text-to-image": ReplicateTask("text-to-image"),
         "text-to-speech": ReplicateTextToSpeechTask(),

src/huggingface_hub/inference/_providers/novita.py

Lines changed: 26 additions & 0 deletions
@@ -0,0 +1,26 @@
+from huggingface_hub.inference._providers._common import (
+    BaseConversationalTask,
+    BaseTextGenerationTask,
+)
+
+
+_PROVIDER = "novita"
+_BASE_URL = "https://api.novita.ai/v3/openai"
+
+
+class NovitaTextGenerationTask(BaseTextGenerationTask):
+    def __init__(self):
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
+
+    def _prepare_route(self, mapped_model: str) -> str:
+        # there is no v1/ route for novita
+        return "/completions"
+
+
+class NovitaConversationalTask(BaseConversationalTask):
+    def __init__(self):
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
+
+    def _prepare_route(self, mapped_model: str) -> str:
+        # there is no v1/ route for novita
+        return "/chat/completions"

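Taken together, the registry entry in `_providers/__init__.py` and the two classes above determine where a Novita request goes: the helper is looked up by (provider, task), and its route is appended to the OpenAI-compatible base URL with no `/v1` segment. A self-contained sketch of that resolution; the dictionary and function below are illustrative stand-ins, not the library's internal API.

from typing import Dict

_BASE_URL = "https://api.novita.ai/v3/openai"

# Mirrors the routes returned by the _prepare_route() methods above.
_NOVITA_ROUTES: Dict[str, str] = {
    "text-generation": "/completions",
    "conversational": "/chat/completions",
}


def resolve_url(task: str) -> str:
    # Hypothetical helper composing the final endpoint the way the task classes would.
    return _BASE_URL + _NOVITA_ROUTES[task]


print(resolve_url("text-generation"))  # https://api.novita.ai/v3/openai/completions
print(resolve_url("conversational"))   # https://api.novita.ai/v3/openai/chat/completions
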
src/huggingface_hub/inference/_providers/replicate.py

Lines changed: 5 additions & 1 deletion
@@ -5,9 +5,13 @@
 from huggingface_hub.utils import get_session
 
 
+_PROVIDER = "replicate"
+_BASE_URL = "https://api.replicate.com"
+
+
 class ReplicateTask(TaskProviderHelper):
     def __init__(self, task: str):
-        super().__init__(provider="replicate", base_url="https://api.replicate.com", task=task)
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL, task=task)
 
     def _prepare_headers(self, headers: Dict, api_key: str) -> Dict:
         headers = super()._prepare_headers(headers, api_key)

src/huggingface_hub/inference/_providers/together.py

Lines changed: 7 additions & 3 deletions
@@ -11,11 +11,15 @@
 )
 
 
+_PROVIDER = "together"
+_BASE_URL = "https://api.together.xyz"
+
+
 class TogetherTask(TaskProviderHelper, ABC):
     """Base class for Together API tasks."""
 
     def __init__(self, task: str):
-        super().__init__(provider="together", base_url="https://api.together.xyz", task=task)
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL, task=task)
 
     def _prepare_route(self, mapped_model: str) -> str:
         if self.task == "text-to-image":

@@ -29,12 +33,12 @@ def _prepare_route(self, mapped_model: str) -> str:
 
 class TogetherTextGenerationTask(BaseTextGenerationTask):
     def __init__(self):
-        super().__init__(provider="together", base_url="https://api.together.xyz")
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
 
 
 class TogetherConversationalTask(BaseConversationalTask):
     def __init__(self):
-        super().__init__(provider="together", base_url="https://api.together.xyz")
+        super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
 
 
 class TogetherTextToImageTask(TogetherTask):

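The replicate.py and together.py edits above are the same small refactor: the provider name and base URL move into module-level `_PROVIDER` / `_BASE_URL` constants so every task class in the module references a single definition instead of repeating string literals. A generic sketch of the pattern, with placeholder names not tied to either provider:

_PROVIDER = "example-provider"                  # placeholder, defined once per module
_BASE_URL = "https://api.example-provider.com"  # placeholder, defined once per module


class _BaseTask:
    def __init__(self, provider: str, base_url: str):
        self.provider = provider
        self.base_url = base_url


class ExampleChatTask(_BaseTask):
    def __init__(self):
        # Each task class reuses the constants, so changing the endpoint is a one-line edit.
        super().__init__(provider=_PROVIDER, base_url=_BASE_URL)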