Skip to content

Commit 37125bd

Browse files
Add gptModelCapacity parameter and update model capacity references
1 parent 37c62a0 commit 37125bd

File tree

2 files changed

+9
-3
lines changed

2 files changed

+9
-3
lines changed

infra/main.bicep

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ param existingLogAnalyticsWorkspaceId string = ''
2121
azd : {
2222
type: 'location'
2323
usageName : [
24-
'OpenAI.GlobalStandard.gpt-4o, 50'
24+
'OpenAI.GlobalStandard.gpt-4o, 150'
2525
]
2626
}
2727
})
@@ -39,6 +39,9 @@ param gptModelVersion string = '2024-08-06'
3939
@description('GPT model deployment type:')
4040
param modelDeploymentType string = 'GlobalStandard'
4141

42+
@description('Optional. AI model deployment token capacity.')
43+
param gptModelCapacity int = 150
44+
4245
@description('Set the image tag for the container images used in the solution. Default is "latest".')
4346
param imageTag string = 'latest'
4447

@@ -157,7 +160,7 @@ param aiFoundryAiServicesConfiguration aiServicesConfigurationType = {
157160
sku: 'S0'
158161
deployments: null //Default value set on module configuration
159162
subnetResourceId: null //Default value set on module configuration
160-
modelCapacity: 50
163+
modelCapacity: gptModelCapacity
161164
}
162165

163166
@description('Optional. The configuration to apply for the AI Foundry AI Project resource.')
@@ -742,7 +745,7 @@ var aiFoundryAiServicesModelDeployment = {
742745
sku: {
743746
name: modelDeploymentType
744747
//Currently the capacity is set to 140 for optimal performance.
745-
capacity: aiFoundryAiServicesConfiguration.?modelCapacity ?? 50
748+
capacity: aiFoundryAiServicesConfiguration.?modelCapacity ?? gptModelCapacity
746749
}
747750
raiPolicyName: 'Microsoft.Default'
748751
}

infra/main.parameters.json

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,9 @@
3636
"gptModelVersion": {
3737
"value": "${AZURE_ENV_MODEL_VERSION}"
3838
},
39+
"gptModelCapacity": {
40+
"value": "${AZURE_ENV_MODEL_CAPACITY}"
41+
},
3942
"imageTag": {
4043
"value": "${AZURE_ENV_IMAGE_TAG}"
4144
},

0 commit comments

Comments
 (0)