diff --git a/docs/QuotaCheck.md b/docs/QuotaCheck.md index a0f8a313..623686eb 100644 --- a/docs/QuotaCheck.md +++ b/docs/QuotaCheck.md @@ -1,7 +1,7 @@ ## Check Quota Availability Before Deployment Before deploying the accelerator, **ensure sufficient quota availability** for the required model. -> **For Global Standard | gpt-4.1-mini - increase the capacity to at least 50K tokens for optimal performance.** +> **For Global Standard | gpt4.1-mini - increase the capacity to at least 50K tokens for optimal performance.** ### Login if you have not done so already ``` @@ -11,7 +11,7 @@ azd auth login ### 📌 Default Models & Capacities: ``` -gpt-4.1-mini:30, text-embedding-ada-002:45 +gpt4.1-mini:30, text-embedding-ada-002:45 ``` ### 📌 Default Regions: ``` @@ -37,7 +37,7 @@ australiaeast, francecentral, japaneast, northcentralus, southcentralus, westus, ``` ✔️ Check specific model(s) in default regions: ``` - ./quota_check_params.sh --models gpt-4.1-mini:30,text-embedding-ada-002:45 + ./quota_check_params.sh --models gpt4.1-mini:30,text-embedding-ada-002:45 ``` ✔️ Check default models in specific region(s): ``` @@ -45,11 +45,11 @@ australiaeast, francecentral, japaneast, northcentralus, southcentralus, westus, ``` ✔️ Passing Both models and regions: ``` - ./quota_check_params.sh --models gpt-4.1-mini:30 --regions eastus,westus + ./quota_check_params.sh --models gpt4.1-mini:30 --regions eastus,westus ``` ✔️ All parameters combined: ``` - ./quota_check_params.sh --models gpt-4.1-mini:30,text-embedding-ada-002:45 --regions eastus,westus --verbose + ./quota_check_params.sh --models gpt4.1-mini:30,text-embedding-ada-002:45 --regions eastus,westus --verbose ``` ### **Sample Output** diff --git a/infra/scripts/checkquota.sh b/infra/scripts/checkquota.sh index 9300d23f..f9eb8ce7 100644 --- a/infra/scripts/checkquota.sh +++ b/infra/scripts/checkquota.sh @@ -32,7 +32,7 @@ echo "✅ Azure subscription set successfully." # Define models and their minimum required capacities declare -A MIN_CAPACITY=( - ["OpenAI.Standard.gpt-4.1-mini"]=$GPT_MIN_CAPACITY + ["OpenAI.GlobalStandard.gpt4.1-mini"]=$GPT_MIN_CAPACITY ["OpenAI.GlobalStandard.text-embedding-ada-002"]=$TEXT_EMBEDDING_MIN_CAPACITY ) diff --git a/infra/scripts/quota_check_params.sh b/infra/scripts/quota_check_params.sh index b5728619..ffadf77c 100644 --- a/infra/scripts/quota_check_params.sh +++ b/infra/scripts/quota_check_params.sh @@ -47,7 +47,7 @@ log_verbose() { } # Default Models and Capacities (Comma-separated in "model:capacity" format) -DEFAULT_MODEL_CAPACITY="gpt-4.1-mini:30,text-embedding-ada-002:45" +DEFAULT_MODEL_CAPACITY="gpt4.1-mini:30,text-embedding-ada-002:45" # Convert the comma-separated string into an array IFS=',' read -r -a MODEL_CAPACITY_PAIRS <<< "$DEFAULT_MODEL_CAPACITY"