Skip to content

Commit f95b5f9

Browse files
committed
Port to gpt-4o-mini
1 parent 8db5812 commit f95b5f9

2 files changed

Lines changed: 12 additions & 7 deletions

File tree

‎README.md‎

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ so that you can use the OpenAI API SDKs with keyless (Entra) authentication.
3737

3838
* Provisions an Azure OpenAI account with keyless authentication enabled
3939
* Grants the "Cognitive Services OpenAI User" RBAC role to your user account
40-
* Deploys a gpt-3.5 model by default, but you can modify the [Bicep template](infra/main.bicep) to deploy other models
40+
* Deploys a gpt-4o-mini model by default, but you can modify the [Bicep template](infra/main.bicep) to deploy other models
4141
* Example script uses the [openai](https://pypi.org/project/openai/) Python package to make a request to the Azure OpenAI API
4242

4343
### Architecture diagram

‎infra/main.bicep‎

Lines changed: 11 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -7,25 +7,30 @@ param environmentName string
77

88
@minLength(1)
99
@description('Location for the OpenAI resource')
10-
// https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models#standard-deployment-model-availability
10+
// https://learn.microsoft.com/azure/ai-services/openai/concepts/models?tabs=python-secure%2Cglobal-standard%2Cstandard-chat-completions#models-by-deployment-type
1111
@allowed([
1212
'australiaeast'
1313
'brazilsouth'
1414
'canadaeast'
1515
'eastus'
1616
'eastus2'
1717
'francecentral'
18+
'germanywestcentral'
1819
'japaneast'
20+
'koreacentral'
1921
'northcentralus'
2022
'norwayeast'
23+
'polandcentral'
2124
'southafricanorth'
2225
'southcentralus'
2326
'southindia'
27+
'spaincentral'
2428
'swedencentral'
2529
'switzerlandnorth'
2630
'uksouth'
2731
'westeurope'
2832
'westus'
33+
'westus3'
2934
])
3035
@metadata({
3136
azd: {
@@ -35,15 +40,15 @@ param environmentName string
3540
param location string
3641

3742
@description('Name of the GPT model to deploy')
38-
param gptModelName string = 'gpt-35-turbo'
43+
param gptModelName string = 'gpt-4o-mini'
3944

4045
@description('Version of the GPT model to deploy')
4146
// See version availability in this table:
42-
// https://learn.microsoft.com/azure/ai-services/openai/concepts/models#gpt-4-and-gpt-4-turbo-preview-models
43-
param gptModelVersion string = '0125'
47+
// https://learn.microsoft.com/azure/ai-services/openai/concepts/models?tabs=python-secure%2Cglobal-standard%2Cstandard-chat-completions#models-by-deployment-type
48+
param gptModelVersion string = '2024-07-18'
4449

4550
@description('Name of the model deployment (can be different from the model name)')
46-
param gptDeploymentName string = 'gpt-35-turbo'
51+
param gptDeploymentName string = 'gpt-4o-mini'
4752

4853
@description('Capacity of the GPT deployment')
4954
// You can increase this, but capacity is limited per model and region, so you will get errors if you exceed that limit
@@ -93,7 +98,7 @@ module openAi 'br/public:avm/res/cognitive-services/account:0.7.1' = {
9398
version: gptModelVersion
9499
}
95100
sku: {
96-
name: 'Standard'
101+
name: 'GlobalStandard'
97102
capacity: gptDeploymentCapacity
98103
}
99104
}

0 commit comments

Comments
 (0)