@@ -21,7 +21,7 @@ param existingLogAnalyticsWorkspaceId string = ''
2121 azd : {
2222 type : 'location'
2323 usageName : [
24- 'OpenAI.GlobalStandard.gpt-4o, 50 '
24+ 'OpenAI.GlobalStandard.gpt-4o, 150 '
2525 ]
2626 }
2727})
@@ -39,6 +39,9 @@ param gptModelVersion string = '2024-08-06'
3939@description ('GPT model deployment type:' )
4040param modelDeploymentType string = 'GlobalStandard'
4141
42+ @description ('Optional. AI model deployment token capacity.' )
43+ param gptModelCapacity int = 150
44+
4245@description ('Set the image tag for the container images used in the solution. Default is "latest".' )
4346param imageTag string = 'latest'
4447
@@ -157,7 +160,7 @@ param aiFoundryAiServicesConfiguration aiServicesConfigurationType = {
157160 sku : 'S0'
158161 deployments : null //Default value set on module configuration
159162 subnetResourceId : null //Default value set on module configuration
160- modelCapacity : 50
163+ modelCapacity : gptModelCapacity
161164}
162165
163166@description ('Optional. The configuration to apply for the AI Foundry AI Project resource.' )
@@ -742,7 +745,7 @@ var aiFoundryAiServicesModelDeployment = {
742745 sku : {
743746 name : modelDeploymentType
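744747 //Currently the capacity is set to 140 for optimal performance. NOTE(review): the value 140 does not appear in the capacity expression below - confirm or update this figure.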
745- capacity : aiFoundryAiServicesConfiguration .?modelCapacity ?? 50
748+ capacity : aiFoundryAiServicesConfiguration .?modelCapacity ?? gptModelCapacity
746749 }
747750 raiPolicyName : 'Microsoft.Default'
748751}
0 commit comments