diff --git a/.github/workflows/api_inference_build_documentation.yml b/.github/workflows/api_inference_build_documentation.yml
index 903d8b96e..da805071a 100644
--- a/.github/workflows/api_inference_build_documentation.yml
+++ b/.github/workflows/api_inference_build_documentation.yml
@@ -3,7 +3,7 @@ name: Build Inference API documentation
on:
  push:
    paths:
-      - "docs/api-inference/**"
+      - "docs/inference-providers/**"
    branches:
      - main
@@ -13,8 +13,8 @@ jobs:
    with:
      commit_sha: ${{ github.sha }}
      package: hub-docs
-      package_name: api-inference
-      path_to_docs: hub-docs/docs/api-inference/
+      package_name: inference-providers
+      path_to_docs: hub-docs/docs/inference-providers/
      additional_args: --not_python_module
    secrets:
      hf_token: ${{ secrets.HF_DOC_BUILD_PUSH }}
diff --git a/.github/workflows/api_inference_build_pr_documentation.yml b/.github/workflows/api_inference_build_pr_documentation.yml
index 632dd68c7..5073baad4 100644
--- a/.github/workflows/api_inference_build_pr_documentation.yml
+++ b/.github/workflows/api_inference_build_pr_documentation.yml
@@ -3,7 +3,7 @@ name: Build Inference API PR Documentation
on:
  pull_request:
    paths:
-      - "docs/api-inference/**"
+      - "docs/inference-providers/**"
concurrency:
  group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
@@ -16,6 +16,6 @@ jobs:
      commit_sha: ${{ github.event.pull_request.head.sha }}
      pr_number: ${{ github.event.number }}
      package: hub-docs
-      package_name: api-inference
-      path_to_docs: hub-docs/docs/api-inference/
+      package_name: inference-providers
+      path_to_docs: hub-docs/docs/inference-providers/
      additional_args: --not_python_module
diff --git a/.github/workflows/api_inference_generate_documentation.yml b/.github/workflows/api_inference_generate_documentation.yml
index 9be09b4eb..0ac167453 100644
--- a/.github/workflows/api_inference_generate_documentation.yml
+++ b/.github/workflows/api_inference_generate_documentation.yml
@@ -23,23 +23,23 @@ jobs:
        with:
          run_install: |
            - recursive: true
-              cwd: ./scripts/api-inference
+              cwd: ./scripts/inference-providers
              args: [--frozen-lockfile]
-          package_json_file: ./scripts/api-inference/package.json
+          package_json_file: ./scripts/inference-providers/package.json
      - name: Update huggingface/tasks package
-        working-directory: ./scripts/api-inference
+        working-directory: ./scripts/inference-providers
        run: |
          pnpm update @huggingface/tasks@latest
      # Generate
      - name: Generate API inference documentation
        run: pnpm run generate
-        working-directory: ./scripts/api-inference
+        working-directory: ./scripts/inference-providers
      # Check changes
      - name: Check changes
        run: |
          git diff --name-only > changed_files.txt
-          if grep -v -E "^(scripts/api-inference/package.json|scripts/api-inference/pnpm-lock.yaml)$" changed_files.txt | grep -q '.'; then
+          if grep -v -E "^(scripts/inference-providers/package.json|scripts/inference-providers/pnpm-lock.yaml)$" changed_files.txt | grep -q '.'; then
            echo "changes_detected=true" >> $GITHUB_ENV
          else
            echo "changes_detected=false" >> $GITHUB_ENV
@@ -58,13 +58,13 @@ jobs:
        with:
          token: ${{ secrets.TOKEN_INFERENCE_SYNC_BOT }}
          commit-message: Update API inference documentation (automated)
-          branch: update-api-inference-docs-automated-pr
+          branch: update-inference-providers-docs-automated-pr
          delete-branch: true
          title: "[Bot] Update API inference documentation"
          body: |
            This PR automatically upgrades the `@huggingface/tasks` package and regenerates the API inference documentation by running:
            ```sh
-            cd scripts/api-inference
+            cd scripts/inference-providers
            pnpm update @huggingface/tasks@latest
            pnpm run generate
            ```
diff --git a/.github/workflows/api_inference_upload_pr_documentation.yml b/.github/workflows/api_inference_upload_pr_documentation.yml
index c2c2ab4e0..5df163466 100644
--- a/.github/workflows/api_inference_upload_pr_documentation.yml
+++ b/.github/workflows/api_inference_upload_pr_documentation.yml
@@ -10,7 +10,7 @@ jobs:
  build:
    uses: huggingface/doc-builder/.github/workflows/upload_pr_documentation.yml@main
    with:
-      package_name: api-inference
+      package_name: inference-providers
    secrets:
      hf_token: ${{ secrets.HF_DOC_BUILD_PUSH }}
      comment_bot_token: ${{ secrets.COMMENT_BOT_TOKEN }}
\ No newline at end of file
diff --git a/docs/hub/billing.md b/docs/hub/billing.md
index 9bf4fed6a..6e9f65c26 100644
--- a/docs/hub/billing.md
+++ b/docs/hub/billing.md
@@ -25,9 +25,10 @@ Private repository storage above the [included storage](./storage-limits) will b
The PRO subscription unlocks additional features for users, including:
-- Higher free tier for the Serverless Inference API and when consuming ZeroGPU Spaces
-- Higher [storage capacity](./storage-limits) for private repositories
+- Higher tier for ZeroGPU Spaces usage
- Ability to create ZeroGPU Spaces and use Dev Mode
+- Included credits for [Inference Providers](/docs/inference-providers/)
+- Higher [storage capacity](./storage-limits) for private repositories
- Ability to write Social Posts and Community Blogs
- Leverage the Dataset Viewer on private datasets
@@ -48,7 +49,7 @@ It is billed with the renewal invoices of your PRO or Enterprise Hub subscriptio
## Compute Services on the Hub
-We also directly provide compute services with [Spaces](./spaces), [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) and the [Serverless Inference API](https://huggingface.co/docs/api-inference/index).
+We also directly provide compute services with [Spaces](./spaces), [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) and [Inference Providers](https://huggingface.co/docs/inference-providers/index).
While most of our compute services have a comprehensive free tier, users and organizations can pay to access more powerful hardware accelerators.
diff --git a/docs/hub/models-inference.md b/docs/hub/models-inference.md
index 0301ff5ca..fd785995d 100644
--- a/docs/hub/models-inference.md
+++ b/docs/hub/models-inference.md
@@ -1,9 +1,9 @@
-# Serverless Inference API
+# Inference Providers
-Please refer to [Serverless Inference API Documentation](https://huggingface.co/docs/api-inference) for detailed information.
+Please refer to the [Inference Providers Documentation](https://huggingface.co/docs/inference-providers) for detailed information.
-## What technology do you use to power the Serverless Inference API?
+## What technology do you use to power the HF-Inference API?
For 🤗 Transformers models, [Pipelines](https://huggingface.co/docs/transformers/main_classes/pipelines) power the API.
@@ -14,13 +14,13 @@ On top of `Pipelines` and depending on the model type, there are several product
For models from [other libraries](./models-libraries), the API uses [Starlette](https://www.starlette.io) and runs in [Docker containers](https://github.com/huggingface/api-inference-community/tree/main/docker_images). Each library defines the implementation of [different pipelines](https://github.com/huggingface/api-inference-community/tree/main/docker_images/sentence_transformers/app/pipelines).
-## How can I turn off the Serverless Inference API for my model?
+## How can I turn off the HF-Inference API for my model? Specify `inference: false` in your model card's metadata. ## Why don't I see an inference widget, or why can't I use the API? -For some tasks, there might not be support in the Serverless Inference API, and, hence, there is no widget. +For some tasks, there might not be support in the HF-Inference API, and, hence, there is no widget. For all libraries (except 🤗 Transformers), there is a [library-to-tasks.ts file](https://github.com/huggingface/huggingface.js/blob/main/packages/tasks/src/library-to-tasks.ts) of supported tasks in the API. When a model repository has a task that is not supported by the repository library, the repository has `inference: false` by default. ## Can I send large volumes of requests? Can I get accelerated APIs? @@ -31,6 +31,6 @@ If you are interested in accelerated inference, higher volumes of requests, or a You can check your usage in the [Inference Dashboard](https://ui.endpoints.huggingface.co/endpoints). The dashboard shows both your serverless and dedicated endpoints usage. -## Is there programmatic access to the Serverless Inference API? +## Is there programmatic access to the HF-Inference API? -Yes, the `huggingface_hub` library has a client wrapper documented [here](https://huggingface.co/docs/huggingface_hub/how-to-inference). +Yes, the `huggingface_hub` library has a client wrapper documented [here](https://huggingface.co/docs/huggingface_hub/guides/inference). diff --git a/docs/hub/models-the-hub.md b/docs/hub/models-the-hub.md index 82e103562..6a0dd6b69 100644 --- a/docs/hub/models-the-hub.md +++ b/docs/hub/models-the-hub.md @@ -2,7 +2,7 @@ ## What is the Model Hub? -The Model Hub is where the members of the Hugging Face community can host all of their model checkpoints for simple storage, discovery, and sharing. Download pre-trained models with the [`huggingface_hub` client library](https://huggingface.co/docs/huggingface_hub/index), with 🤗 [`Transformers`](https://huggingface.co/docs/transformers/index) for fine-tuning and other usages or with any of the over [15 integrated libraries](./models-libraries). You can even leverage the [Serverless Inference API](./models-inference) or [Inference Endpoints](https://huggingface.co/docs/inference-endpoints). to use models in production settings. +The Model Hub is where the members of the Hugging Face community can host all of their model checkpoints for simple storage, discovery, and sharing. Download pre-trained models with the [`huggingface_hub` client library](https://huggingface.co/docs/huggingface_hub/index), with 🤗 [`Transformers`](https://huggingface.co/docs/transformers/index) for fine-tuning and other usages or with any of the over [15 integrated libraries](./models-libraries). You can even leverage [Inference Providers](/docs/inference-providers/) or [Inference Endpoints](https://huggingface.co/docs/inference-endpoints) to use models in production settings. 
You can refer to the following video for a guide on navigating the Model Hub:
diff --git a/docs/hub/models-widgets.md b/docs/hub/models-widgets.md
index 33e76841c..42c237e0c 100644
--- a/docs/hub/models-widgets.md
+++ b/docs/hub/models-widgets.md
@@ -168,9 +168,9 @@ Here are some links to examples:
- `table-question-answering`, for instance [`google/tapas-base-finetuned-wtq`](https://huggingface.co/google/tapas-base-finetuned-wtq)
- `sentence-similarity`, for instance [`osanseviero/full-sentence-distillroberta2`](/osanseviero/full-sentence-distillroberta2)
-## How can I control my model's widget Inference API parameters?
+## How can I control my model's widget HF-Inference API parameters?
-Generally, the Inference API for a model uses the default pipeline settings associated with each task. But if you'd like to change the pipeline's default settings and specify additional inference parameters, you can configure the parameters directly through the model card metadata. Refer [here](https://huggingface.co/docs/api-inference/detailed_parameters) for some of the most commonly used parameters associated with each task.
+Generally, the HF-Inference API for a model uses the default pipeline settings associated with each task. But if you'd like to change the pipeline's default settings and specify additional inference parameters, you can configure the parameters directly through the model card metadata. Refer [here](https://huggingface.co/docs/inference-providers/detailed_parameters) for some of the most commonly used parameters associated with each task.
For example, if you want to specify an aggregation strategy for a NER task in the widget:
@@ -188,4 +188,6 @@ inference:
    temperature: 0.7
```
-The Serverless inference API allows you to send HTTP requests to models in the Hugging Face Hub programatically. ⚡⚡ Learn more about it by reading the [Inference API documentation](./models-inference). Finally, you can also deploy all those models to dedicated [Inference Endpoints](https://huggingface.co/docs/inference-endpoints).
+Inference Providers allows you to send HTTP requests to models in the Hugging Face Hub programmatically. It is an abstraction layer on top of external providers. ⚡⚡ Learn more about it by reading the [Inference Providers documentation](/docs/inference-providers).
+Finally, you can also deploy all those models to dedicated [Inference Endpoints](https://huggingface.co/docs/inference-endpoints).
diff --git a/docs/hub/oauth.md b/docs/hub/oauth.md
index e0b5ee8d0..778475d60 100644
--- a/docs/hub/oauth.md
+++ b/docs/hub/oauth.md
@@ -35,7 +35,7 @@ The currently supported scopes are:
- `read-repos`: Get read access to the user's personal repos.
- `write-repos`: Get write/read access to the user's personal repos.
- `manage-repos`: Get full access to the user's personal repos. Also grants repo creation and deletion.
-- `inference-api`: Get access to the [Inference API](https://huggingface.co/docs/api-inference/index), you will be able to make inference requests on behalf of the user.
+- `inference-api`: Get access to the [Inference API](https://huggingface.co/docs/inference-providers/index); you will be able to make inference requests on behalf of the user.
- `write-discussions`: Open discussions and Pull Requests on behalf of the user as well as interact with discussions (including reactions, posting/editing comments, closing discussions, ...). To open Pull Requests on private repos, you need to request the `read-repos` scope as well.
All other information is available in the [OpenID metadata](https://huggingface.co/.well-known/openid-configuration).
diff --git a/docs/hub/spaces-oauth.md b/docs/hub/spaces-oauth.md
index 7323e7c7a..6e262762a 100644
--- a/docs/hub/spaces-oauth.md
+++ b/docs/hub/spaces-oauth.md
@@ -81,7 +81,7 @@ Those scopes are optional and can be added by setting `hf_oauth_scopes` in your
- `read-repos`: Get read access to the user's personal repos.
- `write-repos`: Get write/read access to the user's personal repos.
- `manage-repos`: Get full access to the user's personal repos. Also grants repo creation and deletion.
-- `inference-api`: Get access to the [Inference API](https://huggingface.co/docs/api-inference/index), you will be able to make inference requests on behalf of the user.
+- `inference-api`: Get access to the [Inference API](https://huggingface.co/docs/inference-providers/index); you will be able to make inference requests on behalf of the user.
- `write-discussions`: Open discussions and Pull Requests on behalf of the user as well as interact with discussions (including reactions, posting/editing comments, closing discussions, ...). To open Pull Requests on private repos, you need to request the `read-repos` scope as well.
## Accessing organization resources
diff --git a/docs/hub/spaces-sdks-docker-langfuse.md b/docs/hub/spaces-sdks-docker-langfuse.md
index 6ca90d18e..449952f30 100644
--- a/docs/hub/spaces-sdks-docker-langfuse.md
+++ b/docs/hub/spaces-sdks-docker-langfuse.md
@@ -79,7 +79,7 @@ Langfuse maintains native integrations with many popular LLM frameworks, includi
### Example 1: Trace Calls to HF Serverless API
-As a simple example, here's how to trace LLM calls to the [HF Serverless API](https://huggingface.co/docs/api-inference/en/index) using the Langfuse Python SDK.
+As a simple example, here's how to trace LLM calls to the [HF Serverless API](https://huggingface.co/docs/inference-providers/en/index) using the Langfuse Python SDK.
Be sure to first configure your `LANGFUSE_HOST`, `LANGFUSE_PUBLIC_KEY` and `LANGFUSE_SECRET_KEY` environment variables, and make sure you've [authenticated with your Hugging Face account](https://huggingface.co/docs/huggingface_hub/en/quick-start#authentication).
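The langfuse hunk above ends just before the page's code sample, which is outside the diff context. For reference, a minimal sketch of what such a traced call can look like, assuming the Langfuse v2 Python SDK's `@observe` decorator and `huggingface_hub.InferenceClient`; the model ID is an arbitrary example, not taken from the page:

```python
import os

from huggingface_hub import InferenceClient
from langfuse.decorators import observe

# Assumes LANGFUSE_HOST, LANGFUSE_PUBLIC_KEY, LANGFUSE_SECRET_KEY and HF_TOKEN
# are already exported, as described in the paragraph above.
client = InferenceClient(token=os.environ["HF_TOKEN"])


@observe()  # records inputs, output and latency as a Langfuse trace
def generate(prompt: str) -> str:
    response = client.chat_completion(
        messages=[{"role": "user", "content": prompt}],
        model="HuggingFaceH4/zephyr-7b-beta",  # example model, any chat model works
        max_tokens=100,
    )
    return response.choices[0].message.content


print(generate("What is Hugging Face?"))
```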
diff --git a/docs/api-inference/_redirects.yml b/docs/inference-providers/_redirects.yml similarity index 100% rename from docs/api-inference/_redirects.yml rename to docs/inference-providers/_redirects.yml diff --git a/docs/api-inference/_toctree.yml b/docs/inference-providers/_toctree.yml similarity index 100% rename from docs/api-inference/_toctree.yml rename to docs/inference-providers/_toctree.yml diff --git a/docs/api-inference/hub-api.md b/docs/inference-providers/hub-api.md similarity index 100% rename from docs/api-inference/hub-api.md rename to docs/inference-providers/hub-api.md diff --git a/docs/api-inference/hub-integration.md b/docs/inference-providers/hub-integration.md similarity index 100% rename from docs/api-inference/hub-integration.md rename to docs/inference-providers/hub-integration.md diff --git a/docs/api-inference/index.md b/docs/inference-providers/index.md similarity index 100% rename from docs/api-inference/index.md rename to docs/inference-providers/index.md diff --git a/docs/api-inference/pricing.md b/docs/inference-providers/pricing.md similarity index 100% rename from docs/api-inference/pricing.md rename to docs/inference-providers/pricing.md diff --git a/docs/api-inference/security.md b/docs/inference-providers/security.md similarity index 100% rename from docs/api-inference/security.md rename to docs/inference-providers/security.md diff --git a/docs/api-inference/tasks/audio-classification.md b/docs/inference-providers/tasks/audio-classification.md similarity index 97% rename from docs/api-inference/tasks/audio-classification.md rename to docs/inference-providers/tasks/audio-classification.md index 47144b754..eea7b1daa 100644 --- a/docs/api-inference/tasks/audio-classification.md +++ b/docs/inference-providers/tasks/audio-classification.md @@ -1,8 +1,8 @@
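Separately, the models-inference.md hunk earlier in this patch points to the `huggingface_hub` client wrapper for programmatic access to the HF-Inference API. A minimal sketch of that wrapper in use, assuming `huggingface_hub.InferenceClient`; the model ID is an arbitrary example:

```python
from huggingface_hub import InferenceClient

# The client picks up a token from HF_TOKEN or a prior `huggingface-cli login`.
client = InferenceClient()

# One task as an illustration; chat_completion, text_to_image, etc. follow
# the same call pattern documented in the guide linked above.
result = client.text_classification(
    "I love this!",
    model="distilbert-base-uncased-finetuned-sst-2-english",  # example model
)
print(result)  # labels with confidence scores
```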