Skip to content

Commit 4376279

Browse files
update model type to global standard
1 parent 4cf502e commit 4376279

File tree

4 files changed

+7
-7
lines changed

4 files changed

+7
-7
lines changed

.github/workflows/CI.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -196,15 +196,15 @@ jobs:
196196
# Increase the TPM for the Azure OpenAI models
197197
echo "Increasing TPM for Azure OpenAI models..."
198198
openai_gpt_deployment_url="/subscriptions/${{ secrets.AZURE_SUBSCRIPTION_ID }}/resourceGroups/${{ env.rg_name }}/providers/Microsoft.CognitiveServices/accounts/$openai_resource_name/deployments/gpt-4o-mini?api-version=2023-05-01"
199-
az rest -m put -u "$openai_gpt_deployment_url" -b "{'sku':{'name':'Standard','capacity':${{ env.GPT_CAPACITY }}},'properties': {'model': {'format': 'OpenAI','name': 'gpt-4o-mini','version': '2024-07-18'}}}"
199+
az rest -m put -u "$openai_gpt_deployment_url" -b "{'sku':{'name':'GlobalStandard','capacity':${{ env.GPT_CAPACITY }}},'properties': {'model': {'format': 'OpenAI','name': 'gpt-4o-mini','version': '2024-07-18'}}}"
200200
if [ $? -ne 0 ]; then
201201
echo "Failed to increase TPM for GPT deployment."
202202
exit 1
203203
else
204204
echo "Successfully increased TPM for GPT deployment."
205205
fi
206206
openai_embedding_deployment_url="/subscriptions/${{ secrets.AZURE_SUBSCRIPTION_ID }}/resourceGroups/${{ env.rg_name }}/providers/Microsoft.CognitiveServices/accounts/$openai_resource_name/deployments/text-embedding-large?api-version=2023-05-01"
207-
az rest -m put -u "$openai_embedding_deployment_url" -b "{'sku':{'name':'Standard','capacity': ${{ env.TEXT_EMBEDDING_CAPACITY }}},'properties': {'model': {'format': 'OpenAI','name': 'text-embedding-3-large','version': '1'}}}"
207+
az rest -m put -u "$openai_embedding_deployment_url" -b "{'sku':{'name':'GlobalStandard','capacity': ${{ env.TEXT_EMBEDDING_CAPACITY }}},'properties': {'model': {'format': 'OpenAI','name': 'text-embedding-3-large','version': '1'}}}"
208208
if [ $? -ne 0 ]; then
209209
echo "Failed to increase TPM for Text Embedding deployment."
210210
exit 1

Deployment/bicep/azureopenaiservicemodel.bicep

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@ resource gpt4Deployment 'Microsoft.CognitiveServices/accounts/deployments@2023-0
1010
parent: openAIService
1111
name: name
1212
sku: {
13-
name: 'Standard'
13+
name: 'GlobalStandard'
1414
capacity: model.capacity
1515
}
1616
properties: {

Deployment/checkquota.ps1

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -45,8 +45,8 @@ Write-Host "✅ Azure subscription set successfully."
4545

4646
# Define models and their minimum required capacities
4747
$MIN_CAPACITY = @{
48-
"OpenAI.Standard.gpt-4o-mini" = $GPT_MIN_CAPACITY
49-
"OpenAI.Standard.text-embedding-3-large" = $TEXT_EMBEDDING_MIN_CAPACITY
48+
"OpenAI.GlobalStandard.gpt-4o-mini" = $GPT_MIN_CAPACITY
49+
"OpenAI.GlobalStandard.text-embedding-3-large" = $TEXT_EMBEDDING_MIN_CAPACITY
5050
}
5151

5252
$VALID_REGION = ""

Deployment/main.bicep

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -119,7 +119,7 @@ module gs_openaiservicemodels_gpt4o 'bicep/azureopenaiservicemodel.bicep' = {
119119
version: '2024-07-18'
120120
raiPolicyName: ''
121121
capacity: 1
122-
scaleType: 'Standard'
122+
scaleType: 'GlobalStandard'
123123
}
124124

125125
}
@@ -139,7 +139,7 @@ module gs_openaiservicemodels_text_embedding 'bicep/azureopenaiservicemodel.bice
139139
version: '1'
140140
raiPolicyName: ''
141141
capacity: 1
142-
scaleType: 'Standard'
142+
scaleType: 'GlobalStandard'
143143
}
144144
}
145145
dependsOn: [

0 commit comments

Comments
 (0)