Skip to content

Commit 959af52

Browse files
Merge pull request #307 from microsoft/psl-model-update
ci: model back to gpt4o due to more availability regions
2 parents cdf8856 + 82668d4 commit 959af52

File tree

5 files changed

+30
-28
lines changed

5 files changed

+30
-28
lines changed

.github/workflows/deploy.yml

+2-2
Original file line numberDiff line numberDiff line change
@@ -115,8 +115,8 @@ jobs:
115115
--parameters \
116116
environmentName="${{ env.SOLUTION_PREFIX }}" \
117117
secondaryLocation="eastus2" \
118-
deploymentType="Standard" \
119-
gptModelName="gpt-4" \
118+
deploymentType="GlobalStandard" \
119+
gptModelName="gpt-4o" \
120120
azureOpenaiAPIVersion="2024-05-01-preview" \
121121
gptDeploymentCapacity="10" \
122122
embeddingModel="text-embedding-ada-002" \

README.md

+7-5
Original file line numberDiff line numberDiff line change
@@ -73,19 +73,21 @@ When you start the deployment, most parameters will have **default values**, but
7373

7474
| **Setting** | **Description** | **Default value** |
7575
|------------|----------------| ------------|
76-
| **Azure Region** | The region where resources will be created. | East US|
76+
| **Azure Region** | The region where resources will be created. | eastus |
7777
| **Environment Name** | A **3-20 character alphanumeric value** used to generate a unique ID to prefix the resources. | byctemplate |
7878
| **Secondary Location** | A **less busy** region for **Azure SQL and CosmosDB**, useful in case of availability constraints. | eastus2 |
79-
| **Deployment Type** | Select from a drop-down list. | Standard |
80-
| **GPT Model** | Choose from **gpt-4, gpt-4o** | gpt-4 |
79+
| **Deployment Type** | Select from a drop-down list (**Standard, GlobalStandard**). | GlobalStandard |
80+
| **GPT Model** | Choose from **gpt-4, gpt-4o** | gpt-4o |
8181
| **GPT Model Deployment Capacity** | Configure capacity for **GPT models**. | 30k |
8282
| **Embedding Model** | Default: **text-embedding-ada-002**. | text-embedding-ada-002 |
8383
| **Embedding Model Capacity** | Set the capacity for **embedding models**. | 80k |
8484

8585

8686
### [Optional] Quota Recommendations
87-
By default, the **GPT model capacity** in deployment is set to **30k tokens**.
88-
> **We recommend increasing the capacity to 100k tokens for optimal performance.**
87+
By default, the **GPT-4o model capacity** in deployment is set to **30k tokens**. We recommend the following:
88+
> **For GPT-4o, increase the capacity to at least 150k tokens post-deployment for optimal performance.**
89+
90+
> **For GPT-4, ensure a minimum of 30k–40k tokens for best results.**
8991
9092
To adjust quota settings, follow these [steps](./docs/AzureGPTQuotaSettings.md)
9193

docs/CustomizingAzdParameters.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ azd env set AZURE_ENV_MODEL_DEPLOYMENT_TYPE Standard
2121
Set the Model Name (allowed values: gpt-4, gpt-4o)
2222

2323
```shell
24-
azd env set AZURE_ENV_MODEL_NAME gpt-4
24+
azd env set AZURE_ENV_MODEL_NAME gpt-4o
2525
```
2626

2727
Change the Model Capacity (choose a number based on available GPT model capacity in your subscription)

infra/main.bicep

+2-2
Original file line numberDiff line numberDiff line change
@@ -25,15 +25,15 @@ param secondaryLocation string
2525
'Standard'
2626
'GlobalStandard'
2727
])
28-
param deploymentType string = 'Standard'
28+
param deploymentType string = 'GlobalStandard'
2929

3030
@minLength(1)
3131
@description('Name of the GPT model to deploy:')
3232
@allowed([
3333
'gpt-4o'
3434
'gpt-4'
3535
])
36-
param gptModelName string = 'gpt-4'
36+
param gptModelName string = 'gpt-4o'
3737

3838
param azureOpenaiAPIVersion string = '2024-05-01-preview'
3939

infra/main.json

+18-18
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@
44
"metadata": {
55
"_generator": {
66
"name": "bicep",
7-
"version": "0.33.93.31351",
8-
"templateHash": "15906054451527240113"
7+
"version": "0.34.1.11899",
8+
"templateHash": "498892376344234261"
99
}
1010
},
1111
"parameters": {
@@ -29,7 +29,7 @@
2929
},
3030
"deploymentType": {
3131
"type": "string",
32-
"defaultValue": "Standard",
32+
"defaultValue": "GlobalStandard",
3333
"allowedValues": [
3434
"Standard",
3535
"GlobalStandard"
@@ -41,7 +41,7 @@
4141
},
4242
"gptModelName": {
4343
"type": "string",
44-
"defaultValue": "gpt-4",
44+
"defaultValue": "gpt-4o",
4545
"allowedValues": [
4646
"gpt-4o",
4747
"gpt-4"
@@ -150,8 +150,8 @@
150150
"metadata": {
151151
"_generator": {
152152
"name": "bicep",
153-
"version": "0.33.93.31351",
154-
"templateHash": "15599520231829365667"
153+
"version": "0.34.1.11899",
154+
"templateHash": "5321954130579291970"
155155
}
156156
},
157157
"parameters": {
@@ -243,8 +243,8 @@
243243
"metadata": {
244244
"_generator": {
245245
"name": "bicep",
246-
"version": "0.33.93.31351",
247-
"templateHash": "4317523167912536944"
246+
"version": "0.34.1.11899",
247+
"templateHash": "15644309813710584263"
248248
}
249249
},
250250
"parameters": {
@@ -383,8 +383,8 @@
383383
"metadata": {
384384
"_generator": {
385385
"name": "bicep",
386-
"version": "0.33.93.31351",
387-
"templateHash": "14521272418759600301"
386+
"version": "0.34.1.11899",
387+
"templateHash": "6241332452423283350"
388388
}
389389
},
390390
"parameters": {
@@ -981,8 +981,8 @@
981981
"metadata": {
982982
"_generator": {
983983
"name": "bicep",
984-
"version": "0.33.93.31351",
985-
"templateHash": "6827407487603246290"
984+
"version": "0.34.1.11899",
985+
"templateHash": "5169332991642386736"
986986
}
987987
},
988988
"parameters": {
@@ -1210,8 +1210,8 @@
12101210
"metadata": {
12111211
"_generator": {
12121212
"name": "bicep",
1213-
"version": "0.33.93.31351",
1214-
"templateHash": "15057452249812707948"
1213+
"version": "0.34.1.11899",
1214+
"templateHash": "12565043404933150402"
12151215
}
12161216
},
12171217
"parameters": {
@@ -1696,8 +1696,8 @@
16961696
"metadata": {
16971697
"_generator": {
16981698
"name": "bicep",
1699-
"version": "0.33.93.31351",
1700-
"templateHash": "3309828108890144070"
1699+
"version": "0.34.1.11899",
1700+
"templateHash": "8749313878807873763"
17011701
}
17021702
},
17031703
"parameters": {
@@ -1919,8 +1919,8 @@
19191919
"metadata": {
19201920
"_generator": {
19211921
"name": "bicep",
1922-
"version": "0.33.93.31351",
1923-
"templateHash": "1089111242708527718"
1922+
"version": "0.34.1.11899",
1923+
"templateHash": "16100001477502640669"
19241924
}
19251925
},
19261926
"parameters": {

0 commit comments

Comments
 (0)