MicrosoftDocs
diff --git a/‎articles/ai-foundry/.openpublishing.redirection.ai-studio.json‎
Lines changed: 16 additions & 6 deletions b/‎articles/ai-foundry/.openpublishing.redirection.ai-studio.json‎
Lines changed: 16 additions & 6 deletions
diff --git a/‎articles/ai-foundry/concepts/model-lifecycle-retirement.md‎
Lines changed: 6 additions & 0 deletions b/‎articles/ai-foundry/concepts/model-lifecycle-retirement.md‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎articles/ai-foundry/concepts/models-featured.md‎
Lines changed: 11 additions & 5 deletions b/‎articles/ai-foundry/concepts/models-featured.md‎
Lines changed: 11 additions & 5 deletions
diff --git a/‎articles/ai-foundry/how-to/develop/connections-add-sdk.md‎
Lines changed: 1 addition & 1 deletion b/‎articles/ai-foundry/how-to/develop/connections-add-sdk.md‎
Lines changed: 1 addition & 1 deletion
@@ -110,6 +110,11 @@
             "redirect_url": "/azure/ai-foundry/how-to/data-add",
             "redirect_document_id": true
           },
+          {
+            "source_path_from_root": "/articles/ai-foundry/model-inference/reference/api-version-updates.md",
+            "redirect_url": "/rest/api/aifoundry/modelinference",
+            "redirect_document_id": false
+          },
           {
             "source_path_from_root": "/articles/ai-studio/how-to/deploy-models-cohere-command.md",
             "redirect_url": "/azure/ai-foundry/how-to/deploy-models-cohere-command",
@@ -699,8 +704,8 @@
         },
         {
             "source_path_from_root": "/articles/ai-studio/ai-services/how-to/connect-ai-services.md",
-            "redirect_url": "/azure/ai-foundry/ai-services/how-to/connect-ai-services",
-            "redirect_document_id": true
+            "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
+            "redirect_document_id": false
         },
         {
             "source_path_from_root": "/articles/ai-studio/ai-services/how-to/connect-azure-openai.md",
@@ -875,7 +880,7 @@
         },
         {
             "source_path_from_root": "/articles/ai-studio/how-to/models-foundation-azure-ai.md",
-            "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",
+            "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
             "redirect_document_id": true
         },
         {
@@ -955,17 +960,17 @@
         },
         {
             "source_path_from_root": "/articles/ai-studio/ai-services/get-started.md",
-            "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",
+            "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
             "redirect_document_id": false
         },
         {
             "source_path_from_root": "/articles/ai-studio/ai-services/where-to-use-ai-services.md",
-            "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",
+            "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
             "redirect_document_id": false
         },
         {
             "source_path_from_root": "/articles/ai-studio/ai-services/connect-ai-services.md",
-            "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",
+            "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
             "redirect_document_id": false
         },
         {
@@ -1127,6 +1132,11 @@
             "source_path_from_root": "/articles/ai-foundry/how-to/prompt-flow.md",
             "redirect_url": "/azure/ai-foundry/concepts/prompt-flow",
             "redirect_document_id": true
+        },
+        {
+          "source_path_from_root": "/articles/ai-foundry/ai-services/how-to/connect-ai-services.md",
+          "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",
+          "redirect_document_id": false
         }
     ]
 }
@@ -80,6 +80,12 @@ The following tables list the timelines for models that are on track for retirem
 | [Cohere-rerank-v3-english](https://ai.azure.com/explore/models/Cohere-rerank-v3-english/version/1/registry/azureml-cohere) | February 28, 2025 | March 31, 2025 | June 30, 2025 | [Cohere-rerank-v3.5-english](https://ai.azure.com/explore/models/Cohere-rerank-v3.5/version/1/registry/azureml-cohere) |
 | [Cohere-rerank-v3-multilingual](https://ai.azure.com/explore/models/Cohere-rerank-v3-multilingual/version/1/registry/azureml-cohere) | February 28, 2025 | March 31, 2025 | June 30, 2025 | [Cohere-rerank-v3.5-multilingual](https://ai.azure.com/explore/models/Cohere-rerank-v3.5/version/1/registry/azureml-cohere) |
 
+#### DeepSeek
+
+| Model | Legacy date (UTC) | Deprecation date (UTC) | Retirement date (UTC) | Suggested replacement model |
+|-------|-------------------|------------------------|-----------------------|-----------------------------|
+| [DeepSeek-V3](https://aka.ms/azureai/landing/DeepSeek-V3) | April 10, 2025 | May 31, 2025 | August 31, 2025 | [DeepSeek-V3-0324](https://aka.ms/azureai/landing/DeepSeek-V3-0324) |
+
 #### Meta
 
 | Model | Legacy date (UTC) | Deprecation date (UTC) | Retirement date (UTC) | Suggested replacement model |
 
@@ -27,9 +27,9 @@ To perform inferencing with the models, some models such as [Nixtla's TimeGEN-1]
 
 The Jamba family models are AI21's production-grade Mamba-based large language model (LLM) which uses AI21's hybrid Mamba-Transformer architecture. It's an instruction-tuned version of AI21's hybrid structured state space model (SSM) transformer Jamba model. The Jamba family models are built for reliable commercial use with respect to quality and performance.
 
-| Model  | Type | Capabilities | 
-| ------ | ---- | --- | 
-| [AI21-Jamba-1.5-Mini](https://ai.azure.com/explore/models/AI21-Jamba-1.5-Mini/version/1/registry/azureml-ai21) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (262,144 tokens) <br /> - **Output:**  text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON, structured outputs | | 
+| Model  | Type | Capabilities |
+| ------ | ---- | --- |
+| [AI21-Jamba-1.5-Mini](https://ai.azure.com/explore/models/AI21-Jamba-1.5-Mini/version/1/registry/azureml-ai21) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (262,144 tokens) <br /> - **Output:**  text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON, structured outputs |
 | [AI21-Jamba-1.5-Large](https://ai.azure.com/explore/models/AI21-Jamba-1.5-Large/version/1/registry/azureml-ai21) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (262,144 tokens) <br /> - **Output:**  text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON, structured outputs |
 
 
@@ -68,10 +68,12 @@ The following table lists the Cohere models that you can inference via the  Azur
 
 | Model  | Type | Capabilities | 
 | ------ | ---- | --- | 
+| [Cohere-command-A](https://aka.ms/aistudio/landing/cohere-command-a) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (256,000 tokens) <br /> - **Output:** text (8,000 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text |
 | [Cohere-command-r-plus-08-2024](https://ai.azure.com/explore/models/Cohere-command-r-plus-08-2024/version/1/registry/azureml-cohere) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON |
 | [Cohere-command-r-08-2024](https://ai.azure.com/explore/models/Cohere-command-r-08-2024/version/1/registry/azureml-cohere) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON |
 | [Cohere-command-r-plus](https://ai.azure.com/explore/models/Cohere-command-r-plus/version/1/registry/azureml-cohere) <br> (deprecated) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON |
 | [Cohere-command-r](https://ai.azure.com/explore/models/Cohere-command-r/version/1/registry/azureml-cohere) <br> (deprecated)| [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (4,096 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text, JSON |
+| [Cohere-embed-4](https://aka.ms/aistudio/landing/cohere-embed-4) | [embeddings](../model-inference/how-to/use-embeddings.md?context=/azure/ai-foundry/context/context) <br /> [image-embeddings](../model-inference/how-to/use-image-embeddings.md?context=/azure/ai-foundry/context/context) | - **Input:** image, text <br /> - **Output:** image, text (128,000 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** image, text  |
 | [Cohere-embed-v3-english](https://ai.azure.com/explore/models/Cohere-embed-v3-english/version/1/registry/azureml-cohere) | [embeddings](../model-inference/how-to/use-embeddings.md?context=/azure/ai-foundry/context/context) <br /> [image-embeddings](../model-inference/how-to/use-image-embeddings.md?context=/azure/ai-foundry/context/context) | - **Input:** text (512 tokens) <br /> - **Output:** Vector (1,024 dim.) |
 | [Cohere-embed-v3-multilingual](https://ai.azure.com/explore/models/Cohere-embed-v3-multilingual/version/1/registry/azureml-cohere) | [embeddings](../model-inference/how-to/use-embeddings.md?context=/azure/ai-foundry/context/context) <br /> [image-embeddings](../model-inference/how-to/use-image-embeddings.md?context=/azure/ai-foundry/context/context) | - **Input:** text (512 tokens) <br /> - **Output:** Vector (1,024 dim.) |
 
@@ -141,11 +143,12 @@ For more examples of how to use Jais models, see the following examples:
 
 ## DeepSeek
 
-DeepSeek family of models includes DeepSeek-R1, which excels at reasoning tasks using a step-by-step training process, such as language, scientific reasoning, and coding tasks, and DeepSeek-V3, a Mixture-of-Experts (MoE) language model. 
+DeepSeek family of models includes DeepSeek-R1, which excels at reasoning tasks using a step-by-step training process, such as language, scientific reasoning, and coding tasks, DeepSeek-V3-0324, a Mixture-of-Experts (MoE) language model, and more. 
 
 | Model  | Type | Capabilities | 
 | ------ | ---- | --- | 
-| [DeepSeek-V3](https://ai.azure.com/explore/models/deepseek-v3/version/1/registry/azureml-deepseek) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (131,072 tokens) <br />  - **Tool calling:** No <br /> - **Response formats:** Text, JSON |
+| [DeekSeek-V3-0324](https://ai.azure.com/explore/models/deepseek-v3-0324/version/1/registry/azureml-deepseek) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** (131,072 tokens) <br /> - **Tool calling:** No <br /> - **Response formats:** Text, JSON |
+| [DeepSeek-V3](https://ai.azure.com/explore/models/deepseek-v3/version/1/registry/azureml-deepseek) <br />(Legacy) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (131,072 tokens) <br /> - **Output:** text (131,072 tokens) <br />  - **Tool calling:** No <br /> - **Response formats:** Text, JSON |
 | [DeepSeek-R1](https://ai.azure.com/explore/models/deepseek-r1/version/1/registry/azureml-deepseek) | [chat-completion with reasoning content](../model-inference/how-to/use-chat-reasoning.md?context=/azure/ai-foundry/context/context) | - **Input:** text (163,840 tokens) <br /> - **Output:** text (163,840 tokens) <br />  - **Tool calling:** No <br /> - **Response formats:** Text. |
 
 For a tutorial on DeepSeek-R1, see [Tutorial: Get started with DeepSeek-R1 reasoning model in Azure AI model inference](../model-inference/tutorials/get-started-deepseek-r1.md?context=/azure/ai-foundry/context/context).
@@ -171,9 +174,12 @@ Meta Llama models and tools are a collection of pretrained and fine-tuned genera
 - Small language models (SLMs) like 1B and 3B Base and Instruct models for on-device and edge inferencing
 - Mid-size large language models (LLMs) like 7B, 8B, and 70B Base and Instruct models
 - High-performant models like Meta Llama 3.1-405B Instruct for synthetic data generation and distillation use cases.
+- High-performant natively multimodal models, Llama 4 Scout and Llama 4 Maverick, leverage a mixture-of-experts architecture to offer industry-leading performance in text and image understanding.
 
 | Model  | Type | Capabilities |
 | ------ | ---- | ------------ |
+| [Llama-4-Scout-17B-16E-Instruct](https://aka.ms/aifoundry/landing/llama-4-scout-17b-16e-instruct) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text and image (128,000 tokens) <br /> - **Output:** text (8,192 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text |
+| [Llama 4-Maverick-17B-128E-Instruct-FP8](https://aka.ms/aifoundry/landing/llama-4-maverick-17b-128e-instruct-fp8) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text and image (128,000 tokens) <br /> - **Output:** text (8,192 tokens) <br /> - **Tool calling:** Yes <br /> - **Response formats:** Text |
 | [Llama-3.3-70B-Instruct](https://ai.azure.com/explore/models/Llama-3.3-70B-Instruct/version/4/registry/azureml-meta) | [chat-completion](../model-inference/how-to/use-chat-completions.md?context=/azure/ai-foundry/context/context) | - **Input:** text (128,000 tokens) <br /> - **Output:** text (8,192 tokens) <br /> - **Tool calling:** No <br /> - **Response formats:** Text |
 | [Llama-3.2-90B-Vision-Instruct](https://ai.azure.com/explore/models/Llama-3.2-90B-Vision-Instruct/version/1/registry/azureml-meta) | [chat-completion (with images)](../model-inference/how-to/use-chat-multi-modal.md?context=/azure/ai-foundry/context/context) | - **Input:** text and image (128,000 tokens) <br /> - **Output:** text (8,192 tokens) <br /> - **Tool calling:** No <br /> - **Response formats:** Text |
 | [Llama-3.2-11B-Vision-Instruct](https://ai.azure.com/explore/models/Llama-3.2-11B-Vision-Instruct/version/1/registry/azureml-meta) | [chat-completion (with images)](../model-inference/how-to/use-chat-multi-modal.md?context=/azure/ai-foundry/context/context) | - **Input:** text and image (128,000 tokens) <br /> - **Output:** text (8,192 tokens) <br /> - **Tool calling:** No <br /> - **Response formats:** Text |
 
@@ -73,7 +73,7 @@ ml_client.connections.create_or_update(wps_connection)
 
 ## Azure AI services
 
-The following example creates an Azure AI services connection. This example creates one connection for the AI services documented in the [Connect to Azure AI services](../../ai-services/how-to/connect-ai-services.md) article. The same connection also supports the Azure OpenAI service.
+The following example creates an Azure AI services connection. This example creates one connection for the AI services documented in the [Connect to Azure AI services](../../../ai-services/connect-services-ai-foundry-portal.md) article. The same connection also supports the Azure OpenAI service.
 
 ```python
 from azure.ai.ml.entities import AzureAIServicesConnection, ApiKeyConfiguration
Original file line number	Diff line number	Diff line change
`@@ -110,6 +110,11 @@`
`110`	`110`	`"redirect_url": "/azure/ai-foundry/how-to/data-add",`
`111`	`111`	`"redirect_document_id": true`
`112`	`112`	`},`
	`113`	`+ {`
	`114`	`+ "source_path_from_root": "/articles/ai-foundry/model-inference/reference/api-version-updates.md",`
	`115`	`+ "redirect_url": "/rest/api/aifoundry/modelinference",`
	`116`	`+ "redirect_document_id": false`
	`117`	`+ },`
`113`	`118`	`{`
`114`	`119`	`"source_path_from_root": "/articles/ai-studio/how-to/deploy-models-cohere-command.md",`
`115`	`120`	`"redirect_url": "/azure/ai-foundry/how-to/deploy-models-cohere-command",`
`@@ -699,8 +704,8 @@`
`699`	`704`	`},`
`700`	`705`	`{`
`701`	`706`	`"source_path_from_root": "/articles/ai-studio/ai-services/how-to/connect-ai-services.md",`
`702`		`- "redirect_url": "/azure/ai-foundry/ai-services/how-to/connect-ai-services",`
`703`		`- "redirect_document_id": true`
	`707`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
	`708`	`+ "redirect_document_id": false`
`704`	`709`	`},`
`705`	`710`	`{`
`706`	`711`	`"source_path_from_root": "/articles/ai-studio/ai-services/how-to/connect-azure-openai.md",`
`@@ -875,7 +880,7 @@`
`875`	`880`	`},`
`876`	`881`	`{`
`877`	`882`	`"source_path_from_root": "/articles/ai-studio/how-to/models-foundation-azure-ai.md",`
`878`		`- "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",`
	`883`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
`879`	`884`	`"redirect_document_id": true`
`880`	`885`	`},`
`881`	`886`	`{`
`@@ -955,17 +960,17 @@`
`955`	`960`	`},`
`956`	`961`	`{`
`957`	`962`	`"source_path_from_root": "/articles/ai-studio/ai-services/get-started.md",`
`958`		`- "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",`
	`963`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
`959`	`964`	`"redirect_document_id": false`
`960`	`965`	`},`
`961`	`966`	`{`
`962`	`967`	`"source_path_from_root": "/articles/ai-studio/ai-services/where-to-use-ai-services.md",`
`963`		`- "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",`
	`968`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
`964`	`969`	`"redirect_document_id": false`
`965`	`970`	`},`
`966`	`971`	`{`
`967`	`972`	`"source_path_from_root": "/articles/ai-studio/ai-services/connect-ai-services.md",`
`968`		`- "redirect_url": "/azure/ai-studio/ai-services/how-to/connect-ai-services",`
	`973`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
`969`	`974`	`"redirect_document_id": false`
`970`	`975`	`},`
`971`	`976`	`{`
`@@ -1127,6 +1132,11 @@`
`1127`	`1132`	`"source_path_from_root": "/articles/ai-foundry/how-to/prompt-flow.md",`
`1128`	`1133`	`"redirect_url": "/azure/ai-foundry/concepts/prompt-flow",`
`1129`	`1134`	`"redirect_document_id": true`
	`1135`	`+ },`
	`1136`	`+ {`
	`1137`	`+ "source_path_from_root": "/articles/ai-foundry/ai-services/how-to/connect-ai-services.md",`
	`1138`	`+ "redirect_url": "/azure/ai-services/connect-services-ai-foundry-portal",`
	`1139`	`+ "redirect_document_id": false`
`1130`	`1140`	`}`
`1131`	`1141`	`]`
`1132`	`1142`	`}`