MicrosoftDocs
diff --git a/‎.openpublishing.redirection.json‎
Lines changed: 167 additions & 2 deletions b/‎.openpublishing.redirection.json‎
Lines changed: 167 additions & 2 deletions
diff --git a/‎articles/ai-foundry/model-inference/breadcrumb/toc.yml‎ renamed to ‎articles/ai-foundry/foundry-models/breadcrumb/toc.yml‎
Lines changed: 2 additions & 2 deletions b/‎articles/ai-foundry/model-inference/breadcrumb/toc.yml‎ renamed to ‎articles/ai-foundry/foundry-models/breadcrumb/toc.yml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎articles/ai-foundry/model-inference/concepts/content-filter.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/content-filter.md‎
Lines changed: 1 addition & 1 deletion b/‎articles/ai-foundry/model-inference/concepts/content-filter.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/content-filter.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎articles/ai-foundry/model-inference/concepts/default-safety-policies.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/default-safety-policies.md‎
Lines changed: 3 additions & 3 deletions b/‎articles/ai-foundry/model-inference/concepts/default-safety-policies.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/default-safety-policies.md‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎articles/ai-foundry/model-inference/concepts/deployment-types.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/deployment-types.md‎
Lines changed: 2 additions & 2 deletions b/‎articles/ai-foundry/model-inference/concepts/deployment-types.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/deployment-types.md‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎articles/ai-foundry/model-inference/concepts/endpoints.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/endpoints.md‎
Lines changed: 9 additions & 9 deletions b/‎articles/ai-foundry/model-inference/concepts/endpoints.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/endpoints.md‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎articles/ai-foundry/model-inference/concepts/model-versions.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/model-versions.md‎ b/‎articles/ai-foundry/model-inference/concepts/model-versions.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/model-versions.md‎
diff --git a/‎articles/ai-foundry/model-inference/concepts/models.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/models.md‎
Lines changed: 5 additions & 5 deletions b/‎articles/ai-foundry/model-inference/concepts/models.md‎ renamed to ‎articles/ai-foundry/foundry-models/concepts/models.md‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎articles/ai-foundry/model-inference/context/context.yml‎ renamed to ‎articles/ai-foundry/foundry-models/context/context.yml‎ b/‎articles/ai-foundry/model-inference/context/context.yml‎ renamed to ‎articles/ai-foundry/foundry-models/context/context.yml‎
@@ -1,4 +1,4 @@
-{ 
+{
   "redirections": [
     {
       "source_path": "articles/ai-foundry/concepts/connections.md",
@@ -319,6 +319,171 @@
       "source_path_from_root": "/articles/ai-services/language-service/tutorials/prompt-flow.md",
       "redirect_url": "/azure/ai-services/language-service/tutorials/power-automate",
       "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/content-filter.md",
+      "redirect_url": "../../foundry-models/concepts/content-filter",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/default-safety-policies.md",
+      "redirect_url": "../../foundry-models/concepts/default-safety-policies",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/deployment-types.md",
+      "redirect_url": "../../foundry-models/concepts/deployment-types",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/endpoints.md",
+      "redirect_url": "../../foundry-models/concepts/endpoints",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/models.md",
+      "redirect_url": "../../foundry-models/concepts/models",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/concepts/model-versions.md",
+      "redirect_url": "../../foundry-models/concepts/model-versions",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/configure-content-filters.md",
+      "redirect_url": "../../foundry-models/how-to/configure-content-filters",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/configure-deployment-policies.md",
+      "redirect_url": "../../foundry-models/how-to/configure-deployment-policies",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/configure-entra-id.md",
+      "redirect_url": "../../foundry-models/how-to/configure-entra-id",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/configure-marketplace.md",
+      "redirect_url": "../../foundry-models/how-to/configure-marketplace",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/configure-project-connection.md",
+      "redirect_url": "../../foundry-models/how-to/configure-project-connection",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/create-model-deployments.md",
+      "redirect_url": "../../foundry-models/how-to/create-model-deployments",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/inference.md",
+      "redirect_url": "../../foundry-models/how-to/inference",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/manage-costs.md",
+      "redirect_url": "../../foundry-models/how-to/manage-costs",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/monitor-models.md",
+      "redirect_url": "../../foundry-models/how-to/monitor-models",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/quickstart-ai-project.md",
+      "redirect_url": "../../foundry-models/how-to/quickstart-ai-project",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/quickstart-create-resources.md",
+      "redirect_url": "../../foundry-models/how-to/quickstart-create-resources",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/quickstart-github-models.md",
+      "redirect_url": "../../foundry-models/how-to/quickstart-github-models",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-blocklists.md",
+      "redirect_url": "../../foundry-models/how-to/use-blocklists",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-chat-completions.md",
+      "redirect_url": "../../foundry-models/how-to/use-chat-completions",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-chat-multi-modal.md",
+      "redirect_url": "../../foundry-models/how-to/use-chat-multi-modal",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-chat-reasoning.md",
+      "redirect_url": "../../foundry-models/how-to/use-chat-reasoning",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-embeddings.md",
+      "redirect_url": "../../foundry-models/how-to/use-embeddings",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-image-embeddings.md",
+      "redirect_url": "../../foundry-models/how-to/use-image-embeddings",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/use-structured-outputs.md",
+      "redirect_url": "../../foundry-models/how-to/use-structured-outputs",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/how-to/github/create-model-deployments.md",
+      "redirect_url": "../../../foundry-models/how-to/github/create-model-deployments",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/tutorials/get-started-deepseek-r1.md",
+      "redirect_url": "../../foundry-models/tutorials/get-started-deepseek-r1",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/overview.md",
+      "redirect_url": "../foundry-models/overview",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/quotas-limits.md",
+      "redirect_url": "../foundry-models/quotas-limits",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/supported-languages.md",
+      "redirect_url": "../foundry-models/supported-languages",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/supported-languages-openai.md",
+      "redirect_url": "../foundry-models/supported-languages-openai",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/faq.yml",
+      "redirect_url": "../foundry-models/faq",
+      "redirect_document_id": false
+    },
+    {
+      "source_path": "articles/ai-foundry/model-inference/index.yml",
+      "redirect_url": "../foundry-models/index",
+      "redirect_document_id": false
     }
   ]
-}
+}
@@ -7,5 +7,5 @@
     topicHref: /azure/ai-studio/index
     items:
     - name: Foundry Models
-      tocHref: /azure/ai-foundry/model-inference/
-      topicHref: /azure/ai-foundry/model-inference/index
+      tocHref: /azure/ai-foundry/foundry-models/
+      topicHref: /azure/ai-foundry/foundry-models/index
@@ -80,7 +80,7 @@ Detecting indirect attacks requires using document delimiters when constructing
 
 ## Configurability
 
-[!INCLUDE [content-filter-configurability](../includes/content-filter-configurability.md)]
+[!INCLUDE [content-filter-configurability](../../foundry-models/includes/content-filter-configurability.md)]
 
 ## Scenario details
 
 
@@ -16,12 +16,12 @@ reviewer: santiagxf
 
 Azure AI Foundry Models includes default safety applied to all models, excluding Azure OpenAI Whisper. These configurations provide you with a responsible experience by default.
 
-Default safety aims to mitigate risks such as hate and fairness, sexual, violence, self-harm, protected material content, and user prompt injection attacks. To learn more about content filtering, read [our documentation describing categories and severity levels](content-filter.md).
+Default safety aims to mitigate risks such as hate and fairness, sexual, violence, self-harm, protected material content, and user prompt injection attacks. To learn more about content filtering, read [our documentation describing categories and severity levels](../../model-inference/concepts/content-filter.md).
 
 This document describes the default configuration.
 
 > [!TIP]
-> By default, all model deployments use the default configuration. However, you can configure content filtering per model deployment as explained at [Configuring content filtering](../how-to/configure-content-filters.md).
+> By default, all model deployments use the default configuration. However, you can configure content filtering per model deployment as explained at [Configuring content filtering](../../model-inference/how-to/configure-content-filters.md).
 
 ## Text models
 
@@ -80,4 +80,4 @@ Content filters apply only to text prompts and completions. Images aren't subjec
 
 ## Next steps
 
-* [Configure content filters in Azure AI Foundry Models](../how-to/configure-content-filters.md)
+* [Configure content filters in Azure AI Foundry Models](../../model-inference/how-to/configure-content-filters.md)
@@ -33,7 +33,7 @@ Azure AI Foundry Models provides customers with choices on the hosting structure
 
 Global deployments are available in the same Azure AI Foundry Services as non-global deployment types but allow you to leverage Azure's global infrastructure to dynamically route traffic to the data center with best availability for each request.  Global standard provides the highest default quota and eliminates the need to load balance across multiple resources.  
 
-Customers with high consistent volume may experience greater latency variability. The threshold is set per model. See the [quotas page to learn more](../quotas-limits.md).  For applications that require the lower latency variance at large workload usage, we recommend purchasing provisioned throughput.
+Customers with high consistent volume may experience greater latency variability. The threshold is set per model. See the [quotas page to learn more](../../model-inference/quotas-limits.md).  For applications that require the lower latency variance at large workload usage, we recommend purchasing provisioned throughput.
 
 ## Global provisioned
 
@@ -119,5 +119,5 @@ Administrators can control which model deployment types are available to their u
 
 ## Related content
 
-- [Quotas & limits](../quotas-limits.md)
+- [Quotas & limits](../../model-inference/quotas-limits.md)
 - [Data privacy, and security for Azure AI Foundry Models](../../how-to/concept-data-privacy.md)
@@ -36,7 +36,7 @@ Deployments capture:
 
 An Azure AI Foundry resource can have as many model deployments as needed and they don't incur cost unless inference is performed for those models. Deployments are Azure resources and hence they're subject to Azure policies.
 
-To learn more about how to create deployments see [Add and configure model deployments](../how-to/create-model-deployments.md).
+To learn more about how to create deployments see [Add and configure model deployments](../../model-inference/how-to/create-model-deployments.md).
 
 ## Endpoints
 
@@ -46,7 +46,7 @@ Azure AI Foundry Services (formerly known Azure AI Services) expose multiple end
 > * Azure AI inference endpoint (usually with the form `https://<resource-name>.services.ai.azure.com/models`)
 > * Azure OpenAI endpoint (usually with the form `https://<resource-name>.openai.azure.com`)
 
-The **Azure AI inference endpoint** allows customers to use a single endpoint with the same authentication and schema to generate inference for the deployed models in the resource. All the models support this capability. This endpoint follows the [Azure AI Model Inference API](.././reference/reference-model-inference-api.md). 
+The **Azure AI inference endpoint** allows customers to use a single endpoint with the same authentication and schema to generate inference for the deployed models in the resource. All the models support this capability. This endpoint follows the [Azure AI Model Inference API](../../model-inference/reference/reference-model-inference-api.md). 
 
 The **Azure OpenAI API** exposes the full capabilities of OpenAI models and supports more features like assistants, threads, files, and batch inference. Non-OpenAI models may also be exposed in this route.
 
@@ -60,21 +60,21 @@ The inference endpoint routes requests to a given deployment by matching the par
 
 For example, if you create a deployment named `Mistral-large`, then such deployment can be invoked as:
 
-[!INCLUDE [code-create-chat-client](../includes/code-create-chat-client.md)]
+[!INCLUDE [code-create-chat-client](../../foundry-models/includes/code-create-chat-client.md)]
 
 For a chat model, you can create a request as follows:
 
-[!INCLUDE [code-create-chat-completion](../includes/code-create-chat-completion.md)]
+[!INCLUDE [code-create-chat-completion](../../foundry-models/includes/code-create-chat-completion.md)]
 
-If you specify a model name that doesn't match any given model deployment, you get an error that the model doesn't exist. You can control which models are available for users by creating model deployments as explained at [add and configure model deployments](../how-to/create-model-deployments.md).
+If you specify a model name that doesn't match any given model deployment, you get an error that the model doesn't exist. You can control which models are available for users by creating model deployments as explained at [add and configure model deployments](../../model-inference/how-to/create-model-deployments.md).
 
 ## Key-less authentication
 
 Models deployed to Azure AI Foundry Models in Azure AI Services support key-less authorization using Microsoft Entra ID. Key-less authorization enhances security, simplifies the user experience, reduces operational complexity, and provides robust compliance support for modern development. It makes it a strong choice for organizations adopting secure and scalable identity management solutions.
 
-To use key-less authentication, [configure your resource and grant access to users](../how-to/configure-entra-id.md) to perform inference. Once configured, then you can authenticate as follows:
+To use key-less authentication, [configure your resource and grant access to users](../../model-inference/how-to/configure-entra-id.md) to perform inference. Once configured, you can authenticate as follows:
 
-[!INCLUDE [code-create-chat-client-entra](../includes/code-create-chat-client-entra.md)]
+[!INCLUDE [code-create-chat-client-entra](../../foundry-models/includes/code-create-chat-client-entra.md)]
 
 ## Limitations
 
@@ -83,5 +83,5 @@ To use key-less authentication, [configure your resource and grant access to use
 
 ## Next steps
 
-- [Models](models.md)
-- [Deployment types](deployment-types.md)
+- [Models](../../model-inference/concepts/models.md)
+- [Deployment types](../../model-inference/concepts/deployment-types.md)
@@ -61,10 +61,10 @@ DeepSeek family of models includes DeepSeek-R1, which excels at reasoning tasks
 | ------ | ---- | ---- | ------------ |
 | DeepSeek-R1-0528 <br /> | chat-completion | Global standard | - **Input:** text (163,840 tokens) <br /> - **Output:** text (163,840 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No  <br /> - **Response formats:** Text  |
 | [DeepSeek-V3-0324](https://ai.azure.com/explore/models/deepseek-v3-0324/version/1/registry/azureml-deepseek) | chat-completion | Global standard | - **Input:** text (131,072 tokens) <br /> - **Output:**  (131,072 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON |
-| [DeepSeek-R1](https://ai.azure.com/explore/models/deepseek-r1/version/1/registry/azureml-deepseek) | chat-completion <br /> [(with reasoning content)](../how-to/use-chat-reasoning.md) | Global standard | - **Input:** text (163,840 tokens) <br /> - **Output:**  (163,840 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No <br /> - **Response formats:** Text. |
+| [DeepSeek-R1](https://ai.azure.com/explore/models/deepseek-r1/version/1/registry/azureml-deepseek) | chat-completion <br /> [(with reasoning content)](../../model-inference/how-to/use-chat-reasoning.md) | Global standard | - **Input:** text (163,840 tokens) <br /> - **Output:**  (163,840 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No <br /> - **Response formats:** Text. |
 | [DeepSeek-V3](https://ai.azure.com/explore/models/deepseek-v3/version/1/registry/azureml-deepseek) <br />(Legacy) | chat-completion | Global standard | - **Input:** text (131,072 tokens) <br /> - **Output:**  (131,072 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No <br /> - **Response formats:** Text, JSON |
 
-For a tutorial on DeepSeek-R1, see [Tutorial: Get started with DeepSeek-R1 reasoning model in Azure AI Foundry Models](../tutorials/get-started-deepseek-r1.md).
+For a tutorial on DeepSeek-R1, see [Tutorial: Get started with DeepSeek-R1 reasoning model in Azure AI Foundry Models](../../model-inference/tutorials/get-started-deepseek-r1.md).
 
 See [this model collection in Azure AI Foundry portal](https://ai.azure.com/explore/models?&selectedCollection=deepseek).
 
@@ -75,7 +75,7 @@ Microsoft models include various model groups such as MAI models, Phi models, he
 
 | Model  | Type | Tier | Capabilities |
 | ------ | ---- | --- | ------------ |
-| [MAI-DS-R1](https://ai.azure.com/explore/models/MAI-DS-R1/version/1/registry/azureml) |  chat-completion <br /> [(with reasoning content)](../how-to/use-chat-reasoning.md) | Global standard | - **Input:** text (163,840 tokens) <br /> - **Output:**  (163,840 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No <br /> - **Response formats:** Text. |
+| [MAI-DS-R1](https://ai.azure.com/explore/models/MAI-DS-R1/version/1/registry/azureml) |  chat-completion <br /> [(with reasoning content)](../../model-inference/how-to/use-chat-reasoning.md) | Global standard | - **Input:** text (163,840 tokens) <br /> - **Output:**  (163,840 tokens) <br /> - **Languages:** `en` and `zh` <br />  - **Tool calling:** No <br /> - **Response formats:** Text. |
 
 ### Mistral AI
 
@@ -112,7 +112,7 @@ xAI's Grok 3 and Grok 3 Mini models are designed to excel in various enterprise
 
 Models from Partners and Community available for deployment with pay-as-you-go billing (for example, Cohere models) are offered by the model provider but hosted in Microsoft-managed Azure infrastructure and accessed via API in the Azure AI Foundry. Model providers define the license terms and set the price for use of their models, while Azure AI Foundry manages the hosting infrastructure.
 
-Models from Partners and Community are offered through Azure Marketplace and [requires additional configuration for enabling](../how-to/configure-marketplace.md). 
+Models from Partners and Community are offered through Azure Marketplace and [require additional configuration for enabling](../../model-inference/how-to/configure-marketplace.md). 
 
 ### AI21 Labs
 
@@ -229,4 +229,4 @@ Those models can be of open access or IP protected. In both cases, you have to d
 
 ## Next steps
 
-- Get started today and [deploy your fist model in Azure AI Foundry Models](../how-to/create-model-deployments.md)
+- Get started today and [deploy your first model in Azure AI Foundry Models](../../model-inference/how-to/create-model-deployments.md)