Commit 78a29d6

Merge branch 'update-inference-providers-docs-automated-pr' of github.com:huggingface/hub-docs into update-inference-providers-docs-automated-pr
2 parents: 397ad04 + 4a5cf0c

File tree: 109 files changed (+3487 / -819 lines)

Lines changed: 8 additions & 4 deletions
@@ -1,11 +1,13 @@
-name: Build sagemaker documentation
+name: Build SageMaker Documentation
 
 on:
   push:
-    paths:
-      - "docs/sagemaker/**"
     branches:
       - main
+      - doc-builder*
+    paths:
+      - docs/sagemaker/**
+      - .github/workflows/sagemaker_build_documentation.yaml
 
 jobs:
   build:
@@ -14,7 +16,9 @@ jobs:
       commit_sha: ${{ github.sha }}
       package: hub-docs
       package_name: sagemaker
-      path_to_docs: hub-docs/docs/sagemaker/
+      path_to_docs: hub-docs/docs/sagemaker/source
       additional_args: --not_python_module
+      pre_command: cd hub-docs/docs/sagemaker && make docs
     secrets:
+      token: ${{ secrets.HUGGINGFACE_PUSH }}
       hf_token: ${{ secrets.HF_DOC_BUILD_PUSH }}

.github/workflows/sagemaker_build_pr_documentation.yml

Lines changed: 5 additions & 3 deletions
@@ -1,9 +1,10 @@
-name: Build sagemaker PR Documentation
+name: Build SageMaker PR Documentation
 
 on:
   pull_request:
     paths:
-      - "docs/sagemaker/**"
+      - docs/sagemaker/**
+      - .github/workflows/sagemaker_build_pr_documentation.yaml
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
@@ -17,5 +18,6 @@ jobs:
       pr_number: ${{ github.event.number }}
       package: hub-docs
       package_name: sagemaker
-      path_to_docs: hub-docs/docs/sagemaker/
+      path_to_docs: hub-docs/docs/sagemaker/source
       additional_args: --not_python_module
+      pre_command: cd hub-docs/docs/sagemaker && make docs

.github/workflows/sagemaker_delete_doc_comment.yml

Lines changed: 1 addition & 2 deletions
@@ -1,10 +1,9 @@
-name: Delete sagemaker doc comment trigger
+name: Delete SageMaker PR Documentation Comment
 
 on:
   pull_request:
     types: [ closed ]
 
-
 jobs:
   delete:
     uses: huggingface/doc-builder/.github/workflows/delete_doc_comment_trigger.yml@main

Lines changed: 3 additions & 3 deletions
@@ -1,8 +1,8 @@
-name: Upload sagemaker PR Documentation
+name: Upload SageMaker PR Documentation
 
 on:
   workflow_run:
-    workflows: ["Build sagemaker PR Documentation"]
+    workflows: ["Build SageMaker PR Documentation"]
     types:
       - completed
 
@@ -13,4 +13,4 @@ jobs:
       package_name: sagemaker
     secrets:
       hf_token: ${{ secrets.HF_DOC_BUILD_PUSH }}
-      comment_bot_token: ${{ secrets.COMMENT_BOT_TOKEN }}
+      comment_bot_token: ${{ secrets.COMMENT_BOT_TOKEN }}

docs/hub/_toctree.yml

Lines changed: 5 additions & 1 deletion
@@ -254,6 +254,8 @@
       title: Spaces Dev Mode
     - local: spaces-storage
       title: Spaces Persistent Storage
+    - local: spaces-mcp-servers
+      title: Spaces as MCP servers
     - local: spaces-sdks-gradio
       title: Gradio Spaces
     - local: spaces-sdks-streamlit
@@ -342,12 +344,14 @@
     sections:
       - local: enterprise-sso
         title: Single Sign-On (SSO)
+      - local: enterprise-hub-advanced-sso
+        title: Advanced Single Sign-On (SSO)
       - local: audit-logs
         title: Audit Logs
       - local: storage-regions
         title: Storage Regions
       - local: enterprise-hub-datasets
-        title: Dataset viewer for Private datasets
+        title: Data Studio for Private datasets
       - local: enterprise-hub-resource-groups
         title: Resource Groups (Access Control)
       - local: advanced-compute-options

docs/hub/academia-hub.md

Lines changed: 1 addition & 1 deletion
@@ -22,7 +22,7 @@ Academia Hub is designed for:
 Key Features of Academia Hub:
 
 - **ZeroGPU:** Get 5x usage quota and highest GPU queue priority.
-- **Spaces Hosting:** Create ZeroGPU Spaces with A100 hardware.
+- **Spaces Hosting:** Create ZeroGPU Spaces with H200 hardware.
 - **Spaces Dev Mode:** Fast iterations via SSH/VS Code for Spaces.
 - **Inference Providers:** Get monthly included credits across all Inference Providers.
 - **Dataset Viewer:** Activate it on private datasets.

docs/hub/advanced-compute-options.md

Lines changed: 4 additions & 4 deletions
@@ -1,14 +1,14 @@
 # Advanced Compute Options
 
 <Tip warning={true}>
-This feature is part of the <a href="https://huggingface.co/enterprise">Enterprise Hub</a>.
+This feature is part of the <a href="https://huggingface.co/enterprise">Team & Enterprise</a> plans.
 </Tip>
 
 Enterprise Hub organizations gain access to advanced compute options to accelerate their machine learning journey.
 
 ## Host ZeroGPU Spaces in your organization
 
-ZeroGPU is a dynamic GPU allocation system that optimizes AI deployment on Hugging Face Spaces. By automatically allocating and releasing NVIDIA A100 GPUs (40GB VRAM) as needed, organizations can efficiently serve their AI applications without dedicated GPU instances.
+ZeroGPU is a dynamic GPU allocation system that optimizes AI deployment on Hugging Face Spaces. By automatically allocating and releasing NVIDIA H200 GPU slices (70GB VRAM) as needed, organizations can efficiently serve their AI applications without dedicated GPU instances.
 
 <div class="flex justify-center" style="max-width: 550px">
   <img
@@ -25,9 +25,9 @@ ZeroGPU is a dynamic GPU allocation system that optimizes AI deployment on Huggi
 
 **Key benefits for organizations**
 
-- **Free GPU Access**: Access powerful NVIDIA A100 GPUs at no additional cost through dynamic allocation
+- **Free GPU Access**: Access powerful NVIDIA H200 GPUs at no additional cost through dynamic allocation
 - **Enhanced Resource Management**: Host up to 50 ZeroGPU Spaces for efficient team-wide AI deployment
 - **Simplified Deployment**: Easy integration with PyTorch-based models, Gradio apps, and other Hugging Face libraries
-- **Enterprise-Grade Infrastructure**: Access to high-performance NVIDIA A100 GPUs with 40GB VRAM per workload
+- **Enterprise-Grade Infrastructure**: Access to high-performance NVIDIA H200 GPUs with 70GB VRAM per workload
 
 [Learn more about ZeroGPU →](https://huggingface.co/docs/hub/spaces-zerogpu)
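
For context, the ZeroGPU allocation described above is driven from inside the Space itself: the app decorates its GPU-bound functions and only holds a GPU slice while they run. A minimal sketch, assuming the `@spaces.GPU` decorator pattern from the linked ZeroGPU docs (the model choice is illustrative):

```python
import spaces  # available inside ZeroGPU Spaces
import torch
from diffusers import DiffusionPipeline

# Load weights at startup; ZeroGPU attaches a GPU slice only while a
# @spaces.GPU-decorated function runs, then releases it.
pipe = DiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-xl-base-1.0", torch_dtype=torch.float16
)
pipe.to("cuda")

@spaces.GPU  # request a GPU slice for the duration of this call
def generate(prompt: str):
    return pipe(prompt).images[0]
```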

docs/hub/agents.md

Lines changed: 139 additions & 12 deletions
@@ -1,6 +1,28 @@
 # Agents on the Hub
 
-This page compiles all the libraries and tools Hugging Face offers for agentic workflows: huggingface.js mcp-client, Gradio MCP Server and smolagents.
+This page compiles all the libraries and tools Hugging Face offers for agentic workflows:
+- `HF MCP Server`: Connect your MCP-compatible AI assistant directly to the Hugging Face Hub.
+- `tiny-agents`: A lightweight toolkit for MCP-powered agents, available in both JS (`@huggingface/tiny-agents`) and Python (`huggingface_hub`).
+- `Gradio MCP Server`: Easily create MCP servers from Gradio apps and Spaces.
+- `smolagents`: a Python library that enables you to run powerful agents in a few lines of code.
+
+## HF MCP Server
+
+The official **Hugging Face MCP (Model Context Protocol) Server** enables seamless integration between the Hugging Face Hub and any MCP-compatible AI assistant—including VSCode, Cursor, and Claude Desktop.
+
+With the HF MCP Server, you can enhance your AI assistant's capabilities by connecting directly to the Hub's ecosystem. It comes with:
+- a curated set of **built-in tools** like Spaces and Papers Semantic Search, Model and Dataset exploration, etc.
+- **MCP-compatible Gradio apps**: Connect to any [MCP-compatible Gradio app](https://huggingface.co/spaces?filter=mcp-server) built by the Hugging Face community
+
+#### Getting Started
+
+Visit [huggingface.co/settings/mcp](https://huggingface.co/settings/mcp) to configure your MCP client and get started.
+
+<Tip warning={true}>
+
+This feature is experimental ⚗️ and will continue to evolve.
+
+</Tip>
 
 ## smolagents
 
@@ -43,27 +65,132 @@ with MCPClient(server_parameters) as tools:
 
 Learn more [in the documentation](https://huggingface.co/docs/smolagents/tutorials/tools#use-mcp-tools-with-mcpclient-directly).
 
-## huggingface.js mcp-client
+## tiny-agents (JS and Python)
+
+`tiny-agents` is a lightweight toolkit for running and building MCP-powered agents on top of the Hugging Face Inference Client + Model Context Protocol (MCP). It is available as a JS package `@huggingface/tiny-agents` and in the `huggingface_hub` Python package.
+
+
+### @huggingface/tiny-agents (JS)
+
+The `@huggingface/tiny-agents` package offers a straightforward CLI and a simple programmatic API for running and building MCP-powered agents in JS.
 
-Huggingface.js offers an MCP client served with [Inference Providers](https://huggingface.co/docs/inference-providers/en/index) or local LLMs. Getting started with them is as simple as running `pnpm agent`. You can plug and play different models and providers by setting `PROVIDER` and `MODEL_ID` environment variables.
 
+**Getting Started**
+
+First, you need to install the package:
+
+```bash
+npm install @huggingface/tiny-agents
+# or
+pnpm add @huggingface/tiny-agents
+```
+
+Then, you can run your agent:
 ```bash
-export HF_TOKEN="hf_..."
-export MODEL_ID="Qwen/Qwen2.5-72B-Instruct"
-export PROVIDER="nebius"
-npx @huggingface/mcp-client
+npx @huggingface/tiny-agents [command] "agent/id"
+
+Usage:
+  tiny-agents [flags]
+  tiny-agents run   "agent/id"
+  tiny-agents serve "agent/id"
+
+Available Commands:
+  run      Run the Agent in command-line
+  serve    Run the Agent as an OpenAI-compatible HTTP server
 ```
 
-or, you can use any Local LLM (for example via lmstudio):
+You can load agents directly from the [tiny-agents](https://huggingface.co/datasets/tiny-agents/tiny-agents) Dataset, or specify a path to your own local agent configuration.
+
+**Advanced Usage**
+In addition to the CLI, you can use the `Agent` class for more fine-grained control. For lower-level interactions, use the `MCPClient` from the `@huggingface/mcp-client` package to connect directly to MCP servers and manage tool calls.
+
+Learn more about tiny-agents in the [huggingface.js documentation](https://huggingface.co/docs/huggingface.js/en/tiny-agents/README).
+
+### huggingface_hub (Python)
+
+The `huggingface_hub` library is the easiest way to run MCP-powered agents in Python. It includes a high-level `tiny-agents` CLI as well as programmatic access via the `Agent` and `MCPClient` classes — all built to work with [Hugging Face Inference Providers](https://huggingface.co/docs/inference-providers/index), local LLMs, or any inference endpoint compatible with OpenAI's API specs.
+
+**Getting started**
 
+Install the latest version with MCP support:
 ```bash
-ENDPOINT_URL=http://localhost:1234/v1 \
-MODEL_ID=lmstudio-community/Qwen3-14B-GGUF \
-npx @huggingface/mcp-client
+pip install "huggingface_hub[mcp]>=0.32.2"
 ```
+Then, you can run your agent:
+```bash
+> tiny-agents run --help
+
+Usage: tiny-agents run [OPTIONS] [PATH] COMMAND [ARGS]...
+
+ Run the Agent in the CLI
+
+
+╭─ Arguments ────────────────────────────────────────────────────────────╮
+│ path [PATH] Path to a local folder containing an agent.json file or a built-in agent stored in the 'tiny-agents/tiny-agents' Hugging Face dataset │
+│ (https://huggingface.co/datasets/tiny-agents/tiny-agents) │
+╰────────────────────────────────────────────────────────────────────────╯
+╭─ Options ──────────────────────────────────────────────────────────────╮
+│ --help Show this message and exit. │
+╰────────────────────────────────────────────────────────────────────────╯
+
+```
+
+The CLI pulls the config, connects to its MCP servers, prints the available tools, and waits for your prompt.
+
+**Advanced Usage**
+
+For more fine-grained control, use the `MCPClient` directly. This low-level interface extends `AsyncInferenceClient` and allows LLMs to call tools via the Model Context Protocol (MCP). It supports both local (`stdio`) and remote (`http`/`sse`) MCP servers, handles tool registration and execution, and streams results back to the model in real-time.
+
+Learn more in the [`huggingface_hub` MCP documentation](https://huggingface.co/docs/huggingface_hub/main/en/package_reference/mcp).
+
+
+### Custom Agents
+
+To create your own agent, simply create a folder (e.g., `my-agent/`) and define your agent’s configuration in an `agent.json` file.
+The following example shows a web-browsing agent configured to use the [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) model via the Nebius inference provider, and it comes equipped with a Playwright MCP server, which lets it use a web browser.
+
+```json
+{
+  "model": "Qwen/Qwen2.5-72B-Instruct",
+  "provider": "nebius",
+  "servers": [
+    {
+      "type": "stdio",
+      "config": {
+        "command": "npx",
+        "args": ["@playwright/mcp@latest"]
+      }
+    }
+  ]
+}
+```
+
+To use a local LLM (such as [llama.cpp](https://github.com/ggerganov/llama.cpp), or [LM Studio](https://lmstudio.ai/)), just provide an `endpointUrl`:
+
+```json
+{
+  "model": "Qwen/Qwen3-32B",
+  "endpointUrl": "http://localhost:1234/v1",
+  "servers": [
+    {
+      "type": "stdio",
+      "config": {
+        "command": "npx",
+        "args": ["@playwright/mcp@latest"]
+      }
+    }
+  ]
+}
+
+```
+
+Optionally, add a `PROMPT.md` to customize the system prompt.
+
+<Tip>
 
-You can get more information about mcp-client [here](https://huggingface.co/docs/huggingface.js/en/mcp-client/README).
+Don't hesitate to contribute your agent to the community by opening a Pull Request in the [tiny-agents](https://huggingface.co/datasets/tiny-agents/tiny-agents) Hugging Face dataset.
 
+</Tip>
 
 ## Gradio MCP Server / Tools
 
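For the programmatic Python usage mentioned in the new `huggingface_hub` section above, a minimal sketch mirroring the `agent.json` example; the top-level `Agent` export and the `load_tools()`/`run()` streaming interface are assumptions based on the linked MCP reference, so verify the exact signatures there:

```python
import asyncio
from huggingface_hub import Agent  # pip install "huggingface_hub[mcp]>=0.32.2"

async def main():
    # Same settings as the agent.json example: model + provider + one stdio MCP server.
    agent = Agent(
        model="Qwen/Qwen2.5-72B-Instruct",
        provider="nebius",
        servers=[{
            "type": "stdio",
            "config": {"command": "npx", "args": ["@playwright/mcp@latest"]},
        }],
    )
    await agent.load_tools()  # connect to the MCP servers and register their tools
    async for chunk in agent.run("What are today's trending models on Hugging Face?"):
        print(chunk)  # streamed completion deltas and tool-call results

asyncio.run(main())
```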
docs/hub/api.md

Lines changed: 1 addition & 1 deletion
@@ -1,6 +1,6 @@
 # Hub API Endpoints
 
-We have open endpoints that you can use to retrieve information from the Hub as well as perform certain actions such as creating model, dataset or Space repos. We offer a wrapper Python library, [`huggingface_hub`](https://github.com/huggingface/huggingface_hub), that allows easy access to these endpoints. We also provide [webhooks](./webhooks) to receive real-time incremental info about repos. Enjoy!
+We have open endpoints that you can use to retrieve information from the Hub as well as perform certain actions such as creating model, dataset or Space repos. We offer a wrapper Python client, [`huggingface_hub`](https://github.com/huggingface/huggingface_hub), and a JS client, [`huggingface.js`](https://github.com/huggingface/huggingface.js), that allow easy access to these endpoints. We also provide [webhooks](./webhooks) to receive real-time incremental info about repos. Enjoy!
 
 The base URL for those endpoints below is `https://huggingface.co`. For example, to construct the `/api/models` call below, one can call the URL [https://huggingface.co/api/models](https://huggingface.co/api/models)
 
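To illustrate the base-URL construction above, the `/api/models` endpoint can be queried with any HTTP client. A minimal sketch using `requests`; the `search` and `limit` query parameters are assumed here as standard Hub list filters:

```python
import requests

# GET https://huggingface.co/api/models -- the same URL works in a browser.
response = requests.get(
    "https://huggingface.co/api/models",
    params={"search": "bert", "limit": 3},
)
response.raise_for_status()
for model in response.json():
    print(model["id"])
```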
docs/hub/audit-logs.md

Lines changed: 1 addition & 1 deletion
@@ -1,7 +1,7 @@
 # Audit Logs
 
 <Tip warning={true}>
-This feature is part of the <a href="https://huggingface.co/enterprise">Enterprise Hub</a>.
+This feature is part of the <a href="https://huggingface.co/enterprise">Team & Enterprise</a> plans.
 </Tip>
 
 Audit Logs enable organization admins to easily review actions taken by members, including organization membership, repository settings and billing changes.
