Skip to content

Commit efe4d10

Browse files
authored
Merge pull request #242 from microsoft/aitemplate_updates
fix: update yaml, readme and bicep
2 parents 07eb495 + c6d572b commit efe4d10

File tree

5 files changed

+40
-40
lines changed

5 files changed

+40
-40
lines changed

README.md

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -70,14 +70,14 @@ Please check the link [Azure Products by Region](https://azure.microsoft.com/en-
7070

7171
- Embedding model capacity
7272

73-
### Quota Recommendations
74-
- Please deploy with minimum **30k tokens**.
75-
- For optimal performance, it is recommended to increase token to **100K**
76-
- You can also view the Quotas tab in [Azure OpenAI studio](https://oai.azure.com/)
77-
to understand how much capacity you have.
78-
79-
![image](./docs/Images/ReadMe/quotaImage.png)
80-
73+
### [Optional]: Quota Recommendations
74+
- The default for the GPT model capacity in deployment is **30k tokens**.
75+
- For optimal performance, it is recommended to increase to **100k tokens**.
76+
- Navigate to the [Azure AI Foundry portal](https://ai.azure.com/).
77+
- Select the AI Project you are using for this accelerator if you are not already in the project.
78+
- Select `Management center` from the bottom-left navigation menu.
79+
- Select `Quota`, click the `GlobalStandard` dropdown and select the GPT model and region you are using for this accelerator to see your available quota.
80+
- Request more quota or delete any unused model deployments as needed.
8181

8282

8383
### **Options**
@@ -211,7 +211,7 @@ azd env set AZURE_ENV_MODEL_NAME gpt-4o-mini
211211
Change the Model Capacity (choose a number based on available GPT model capacity in your subscription)
212212
213213
```shell
214-
azd env set AZURE_ENV_MODEL_CAPACITY 100
214+
azd env set AZURE_ENV_MODEL_CAPACITY 30
215215
```
216216
217217
Change the Embedding Model

azure.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
environment:
55
name: conversation-knowledge-mining
66
location: eastus
7-
7+
name: conversation-knowledge-mining
88
metadata:
99
1010

infra/main.bicep

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,7 @@ var gptModelVersion = '2024-02-15-preview'
5050
@description('Capacity of the GPT deployment:')
5151
// You can increase this, but capacity is limited per model/region, so you will get errors if you go over
5252
// https://learn.microsoft.com/en-us/azure/ai-services/openai/quotas-limits
53-
param gptDeploymentCapacity int = 100
53+
param gptDeploymentCapacity int = 30
5454

5555
@minLength(1)
5656
@description('Name of the Text Embedding model to deploy:')

infra/main.bicepparam

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,6 @@ param contentUnderstandingLocation = readEnvironmentVariable('AZURE_ENV_CU_LOCAT
55
param secondaryLocation = readEnvironmentVariable('AZURE_ENV_SECONDARY_LOCATION', 'eastus2')
66
param deploymentType = readEnvironmentVariable('AZURE_ENV_MODEL_DEPLOYMENT_TYPE', 'GlobalStandard')
77
param gptModelName = readEnvironmentVariable('AZURE_ENV_MODEL_NAME', 'gpt-4o-mini')
8-
param gptDeploymentCapacity = int(readEnvironmentVariable('AZURE_ENV_MODEL_CAPACITY', '100'))
8+
param gptDeploymentCapacity = int(readEnvironmentVariable('AZURE_ENV_MODEL_CAPACITY', '30'))
99
param embeddingModel = readEnvironmentVariable('AZURE_ENV_EMBEDDING_MODEL_NAME', 'text-embedding-ada-002')
1010
param embeddingDeploymentCapacity = int(readEnvironmentVariable('AZURE_ENV_EMBEDDING_MODEL_CAPACITY', '80'))

infra/main.json

Lines changed: 28 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@
44
"metadata": {
55
"_generator": {
66
"name": "bicep",
7-
"version": "0.31.92.45157",
8-
"templateHash": "11629204665350113499"
7+
"version": "0.33.93.31351",
8+
"templateHash": "10535791601593705798"
99
}
1010
},
1111
"parameters": {
@@ -66,7 +66,7 @@
6666
},
6767
"gptDeploymentCapacity": {
6868
"type": "int",
69-
"defaultValue": 100,
69+
"defaultValue": 30,
7070
"minValue": 10,
7171
"metadata": {
7272
"description": "Capacity of the GPT deployment:"
@@ -129,8 +129,8 @@
129129
"metadata": {
130130
"_generator": {
131131
"name": "bicep",
132-
"version": "0.31.92.45157",
133-
"templateHash": "14275103612814336681"
132+
"version": "0.33.93.31351",
133+
"templateHash": "4123789684929590981"
134134
}
135135
},
136136
"parameters": {
@@ -221,8 +221,8 @@
221221
"metadata": {
222222
"_generator": {
223223
"name": "bicep",
224-
"version": "0.31.92.45157",
225-
"templateHash": "5910651074687744132"
224+
"version": "0.33.93.31351",
225+
"templateHash": "4388214478635448075"
226226
}
227227
},
228228
"parameters": {
@@ -365,8 +365,8 @@
365365
"metadata": {
366366
"_generator": {
367367
"name": "bicep",
368-
"version": "0.31.92.45157",
369-
"templateHash": "15158547531678904427"
368+
"version": "0.33.93.31351",
369+
"templateHash": "7803735516770365352"
370370
}
371371
},
372372
"parameters": {
@@ -1057,8 +1057,8 @@
10571057
"metadata": {
10581058
"_generator": {
10591059
"name": "bicep",
1060-
"version": "0.31.92.45157",
1061-
"templateHash": "8276956277243695834"
1060+
"version": "0.33.93.31351",
1061+
"templateHash": "14620142974675285735"
10621062
}
10631063
},
10641064
"parameters": {
@@ -1241,8 +1241,8 @@
12411241
"metadata": {
12421242
"_generator": {
12431243
"name": "bicep",
1244-
"version": "0.31.92.45157",
1245-
"templateHash": "15083329960647515030"
1244+
"version": "0.33.93.31351",
1245+
"templateHash": "3100365088410602500"
12461246
}
12471247
},
12481248
"parameters": {
@@ -1289,7 +1289,7 @@
12891289
"resources": [
12901290
{
12911291
"copy": {
1292-
"name": "list",
1292+
"name": "database::list",
12931293
"count": "[length(variables('containers'))]"
12941294
},
12951295
"type": "Microsoft.DocumentDB/databaseAccounts/sqlDatabases/containers",
@@ -1447,8 +1447,8 @@
14471447
"metadata": {
14481448
"_generator": {
14491449
"name": "bicep",
1450-
"version": "0.31.92.45157",
1451-
"templateHash": "5779941490382286977"
1450+
"version": "0.33.93.31351",
1451+
"templateHash": "6170430466600233564"
14521452
}
14531453
},
14541454
"parameters": {
@@ -1621,8 +1621,8 @@
16211621
"metadata": {
16221622
"_generator": {
16231623
"name": "bicep",
1624-
"version": "0.31.92.45157",
1625-
"templateHash": "9223261981384212100"
1624+
"version": "0.33.93.31351",
1625+
"templateHash": "509460209037223451"
16261626
}
16271627
},
16281628
"parameters": {
@@ -1704,8 +1704,8 @@
17041704
"metadata": {
17051705
"_generator": {
17061706
"name": "bicep",
1707-
"version": "0.31.92.45157",
1708-
"templateHash": "2728825545778646651"
1707+
"version": "0.33.93.31351",
1708+
"templateHash": "16955379019952955448"
17091709
}
17101710
},
17111711
"parameters": {
@@ -1800,8 +1800,8 @@
18001800
"metadata": {
18011801
"_generator": {
18021802
"name": "bicep",
1803-
"version": "0.31.92.45157",
1804-
"templateHash": "10011942677204719320"
1803+
"version": "0.33.93.31351",
1804+
"templateHash": "7630355864427423039"
18051805
}
18061806
},
18071807
"parameters": {
@@ -2036,8 +2036,8 @@
20362036
"metadata": {
20372037
"_generator": {
20382038
"name": "bicep",
2039-
"version": "0.31.92.45157",
2040-
"templateHash": "8269871966991453242"
2039+
"version": "0.33.93.31351",
2040+
"templateHash": "17601259288614778920"
20412041
}
20422042
},
20432043
"parameters": {
@@ -2287,8 +2287,8 @@
22872287
"metadata": {
22882288
"_generator": {
22892289
"name": "bicep",
2290-
"version": "0.31.92.45157",
2291-
"templateHash": "7009743990995290371"
2290+
"version": "0.33.93.31351",
2291+
"templateHash": "18414416216987649125"
22922292
}
22932293
},
22942294
"parameters": {
@@ -2399,8 +2399,8 @@
23992399
"metadata": {
24002400
"_generator": {
24012401
"name": "bicep",
2402-
"version": "0.31.92.45157",
2403-
"templateHash": "14810546478282650129"
2402+
"version": "0.33.93.31351",
2403+
"templateHash": "2717758861842552802"
24042404
}
24052405
},
24062406
"parameters": {

0 commit comments

Comments
 (0)