Skip to content

Commit 699e496

Browse files
Merge pull request #208 from Azure-Samples/model-router
Adding gpt-5
2 parents 5639a4d + 42ab7cf commit 699e496

File tree

3 files changed

+5
-3
lines changed

3 files changed

+5
-3
lines changed

images/model-routing.gif

-5.49 KB
Loading

labs/model-routing/model-routing.ipynb

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -58,6 +58,7 @@
5858
" {\"name\": \"gpt-4.1-mini\", \"publisher\": \"OpenAI\", \"version\": \"2025-04-14\", \"sku\": \"GlobalStandard\", \"capacity\": 20, \"aiservice\": \"foundry2\"},\n",
5959
" {\"name\": \"gpt-4.1-nano\", \"publisher\": \"OpenAI\", \"version\": \"2025-04-14\", \"sku\": \"GlobalStandard\", \"capacity\": 20, \"aiservice\": \"foundry2\"},\n",
6060
" {\"name\": \"model-router\", \"publisher\": \"OpenAI\", \"version\": \"2025-05-19\", \"sku\": \"GlobalStandard\", \"capacity\": 20, \"aiservice\": \"foundry3\"},\n",
61+
" {\"name\": \"gpt-5\", \"publisher\": \"OpenAI\", \"version\": \"2025-08-07\", \"sku\": \"GlobalStandard\", \"capacity\": 20, \"aiservice\": \"foundry3\"},\n",
6162
" {\"name\": \"DeepSeek-R1\", \"publisher\": \"DeepSeek\", \"version\": \"1\", \"sku\": \"GlobalStandard\", \"capacity\": 20, \"aiservice\": \"foundry3\"}]\n",
6263
"\n",
6364
"apim_sku = 'Basicv2'\n",
@@ -202,7 +203,7 @@
202203
" api_version=inference_api_version\n",
203204
")\n",
204205
"try:\n",
205-
" for model in ['model-router', 'DeepSeek-R1', 'gpt-4.1']:\n",
206+
" for model in ['model-router', 'DeepSeek-R1', 'gpt-4.1', 'gpt-5']:\n",
206207
" completion = client.chat.completions.with_raw_response.create(model=model, messages=messages)\n",
207208
" # print(\"headers \", completion.headers)\n",
208209
" print(\"x-ms-region: \", completion.headers.get(\"x-ms-region\")) # this header is useful to determine the region of the backend that served the request\n",
@@ -238,7 +239,7 @@
238239
" api_version=inference_api_version\n",
239240
")\n",
240241
"try:\n",
241-
" for model in ['gpt-4.1-mini', 'gpt-4.1-nano', 'gpt-4.1']:\n",
242+
" for model in ['gpt-4.1-mini', 'gpt-4.1-nano', 'gpt-4.1', 'gpt-5']:\n",
242243
" responses = client.responses.with_raw_response.create(model=model, input=input_message)\n",
243244
" # print(\"headers \", responses.headers)\n",
244245
" print(\"x-ms-region: \", responses.headers.get(\"x-ms-region\"))\n",

labs/model-routing/policy.xml

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,8 @@
2727
<set-backend-service backend-id="foundry2" />
2828
</when>
2929
<when condition="@( ((string)context.Variables["requestedModel"]) == "model-router"
30-
|| ((string)context.Variables["requestedModel"]) == "DeepSeek-R1")">
30+
|| ((string)context.Variables["requestedModel"]) == "gpt-5"
31+
|| ((string)context.Variables["requestedModel"]) == "DeepSeek-R1")">
3132
<set-backend-service backend-id="foundry3" />
3233
</when>
3334
<!-- gate any GPT-4o* variants -->

0 commit comments

Comments
 (0)