From 42d2a53c1d573c1f0f9b69e02c6e8536aa92bbb5 Mon Sep 17 00:00:00 2001 From: Priyanka-Microsoft Date: Mon, 14 Jul 2025 12:46:18 +0530 Subject: [PATCH] updated model capacity minimum to 200 --- .github/workflows/CAdeploy.yml | 4 ++-- docs/QuotaCheck.md | 8 ++++---- infra/scripts/quota_check_params.sh | 2 +- 3 files changed, 7 insertions(+), 7 deletions(-) diff --git a/.github/workflows/CAdeploy.yml b/.github/workflows/CAdeploy.yml index c63599e2b..73806dbbc 100644 --- a/.github/workflows/CAdeploy.yml +++ b/.github/workflows/CAdeploy.yml @@ -10,8 +10,8 @@ on: - cron: '0 6,18 * * *' # Runs at 6:00 AM and 6:00 PM GMT env: - GPT_MIN_CAPACITY: 250 - TEXT_EMBEDDING_MIN_CAPACITY: 40 + GPT_MIN_CAPACITY: 200 + TEXT_EMBEDDING_MIN_CAPACITY: 80 BRANCH_NAME: ${{ github.head_ref || github.ref_name }} jobs: diff --git a/docs/QuotaCheck.md b/docs/QuotaCheck.md index 872106410..b5a9818c3 100644 --- a/docs/QuotaCheck.md +++ b/docs/QuotaCheck.md @@ -11,7 +11,7 @@ azd auth login ### 📌 Default Models & Capacities: ``` -gpt-4o-mini:30, text-embedding-ada-002:80 +gpt-4o-mini:200, text-embedding-ada-002:80 ``` ### 📌 Default Regions: ``` @@ -37,7 +37,7 @@ eastus, uksouth, eastus2, northcentralus, swedencentral, westus, westus2, southc ``` ✔️ Check specific model(s) in default regions: ``` - ./quota_check_params.sh --models gpt-4o-mini:30,text-embedding-ada-002:80 + ./quota_check_params.sh --models gpt-4o-mini:200,text-embedding-ada-002:80 ``` ✔️ Check default models in specific region(s): ``` @@ -45,11 +45,11 @@ eastus, uksouth, eastus2, northcentralus, swedencentral, westus, westus2, southc ``` ✔️ Passing Both models and regions: ``` - ./quota_check_params.sh --models gpt-4o-mini:30 --regions eastus,westus2 + ./quota_check_params.sh --models gpt-4o-mini:200 --regions eastus,westus2 ``` ✔️ All parameters combined: ``` - ./quota_check_params.sh --models gpt-4o-mini:30,text-embedding-ada-002:80 --regions eastus,westus --verbose + ./quota_check_params.sh --models 
gpt-4o-mini:200,text-embedding-ada-002:80 --regions eastus,westus --verbose ``` ### **Sample Output** diff --git a/infra/scripts/quota_check_params.sh b/infra/scripts/quota_check_params.sh index 62a2305c8..ace6808a1 100755 --- a/infra/scripts/quota_check_params.sh +++ b/infra/scripts/quota_check_params.sh @@ -47,7 +47,7 @@ log_verbose() { } # Default Models and Capacities (Comma-separated in "model:capacity" format) -DEFAULT_MODEL_CAPACITY="gpt-4o-mini:30,text-embedding-ada-002:80" +DEFAULT_MODEL_CAPACITY="gpt-4o-mini:200,text-embedding-ada-002:80" # Convert the comma-separated string into an array IFS=',' read -r -a MODEL_CAPACITY_PAIRS <<< "$DEFAULT_MODEL_CAPACITY"