Skip to content

Commit 6cabcda

Browse files
committed
Update model configs [2026-02-04T09:27:51.298Z]
1 parent 945f8ee commit 6cabcda

462 files changed

Lines changed: 3787 additions & 766 deletions

File tree

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.
Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,6 @@
1+
model: azure-tts-hd
2+
costs:
3+
input_cost_per_character: 0.00003
4+
mode: audio_speech
5+
defaultRegion: speech
6+
original_provider: azure
Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,6 @@
1+
model: azure-tts
2+
costs:
3+
input_cost_per_character: 0.000015
4+
mode: audio_speech
5+
defaultRegion: speech
6+
original_provider: azure
Lines changed: 8 additions & 46 deletions
Original file line number | Diff line number | Diff line change
@@ -1,53 +1,15 @@
11
model: gpt-4.1-2025-04-14
22
costs:
3-
input_cost_per_token: 0.000002
4-
output_cost_per_token: 0.000008
5-
input_cost_per_token_batches: 0.000001
6-
output_cost_per_token_batches: 0.000004
7-
cache_read_input_token_cost: 5.e-7
3+
input_cost_per_token: 0.0000022
4+
output_cost_per_token: 0.0000088
5+
input_cost_per_token_batches: 0.0000011
6+
output_cost_per_token_batches: 0.0000044
7+
cache_read_input_token_cost: 5.5e-7
88
limits:
9-
max_tokens: 4096
9+
max_tokens: 32768
1010
max_input_tokens: 1047576
1111
max_output_tokens: 32768
12-
features: [function_calling, parallel_function_calling, vision, chat, image]
13-
params:
14-
- key: max_completion_tokens
15-
defaultValue: 1000
16-
minValue: 1
17-
maxValue: 32768
18-
- key: response_format
19-
defaultValue: null
20-
options:
21-
- value: null
22-
name: Text
23-
- value: json_object
24-
name: JSON Object
25-
schema:
26-
type: object
27-
properties:
28-
type:
29-
type: string
30-
value: json_object
31-
- value: json_schema
32-
name: JSON Schema
33-
schema:
34-
type: object
35-
properties:
36-
type:
37-
type: string
38-
value: json_schema
39-
json_schema:
40-
type: object
41-
params:
42-
key: json_schema
43-
defaultValue: null
44-
type: json
45-
skipValues:
46-
- null
47-
skipValues:
48-
- null
49-
type: string
50-
removeParams:
51-
- max_tokens
12+
features: [function_calling, parallel_function_calling, vision]
5213
mode: chat
14+
defaultRegion: us
5315
original_provider: azure
Lines changed: 8 additions & 46 deletions
Original file line number | Diff line number | Diff line change
@@ -1,53 +1,15 @@
11
model: gpt-4.1-mini-2025-04-14
22
costs:
3-
input_cost_per_token: 4.e-7
4-
output_cost_per_token: 0.0000016
5-
input_cost_per_token_batches: 2.e-7
6-
output_cost_per_token_batches: 8.e-7
7-
cache_read_input_token_cost: 1.e-7
3+
input_cost_per_token: 4.4e-7
4+
output_cost_per_token: 0.00000176
5+
input_cost_per_token_batches: 2.2e-7
6+
output_cost_per_token_batches: 8.8e-7
7+
cache_read_input_token_cost: 1.1e-7
88
limits:
9-
max_tokens: 4096
9+
max_tokens: 32768
1010
max_input_tokens: 1047576
1111
max_output_tokens: 32768
12-
features: [function_calling, parallel_function_calling, vision, chat, image]
13-
params:
14-
- key: max_completion_tokens
15-
defaultValue: 1000
16-
minValue: 1
17-
maxValue: 32768
18-
- key: response_format
19-
defaultValue: null
20-
options:
21-
- value: null
22-
name: Text
23-
- value: json_object
24-
name: JSON Object
25-
schema:
26-
type: object
27-
properties:
28-
type:
29-
type: string
30-
value: json_object
31-
- value: json_schema
32-
name: JSON Schema
33-
schema:
34-
type: object
35-
properties:
36-
type:
37-
type: string
38-
value: json_schema
39-
json_schema:
40-
type: object
41-
params:
42-
key: json_schema
43-
defaultValue: null
44-
type: json
45-
skipValues:
46-
- null
47-
skipValues:
48-
- null
49-
type: string
50-
removeParams:
51-
- max_tokens
12+
features: [function_calling, parallel_function_calling, vision]
5213
mode: chat
14+
defaultRegion: us
5315
original_provider: azure
Lines changed: 7 additions & 45 deletions
Original file line number | Diff line number | Diff line change
@@ -1,53 +1,15 @@
11
model: gpt-4.1-nano-2025-04-14
22
costs:
3-
input_cost_per_token: 1.e-7
4-
output_cost_per_token: 4.e-7
5-
input_cost_per_token_batches: 5.e-8
6-
output_cost_per_token_batches: 2.e-7
3+
input_cost_per_token: 1.1e-7
4+
output_cost_per_token: 4.4e-7
5+
input_cost_per_token_batches: 6.e-8
6+
output_cost_per_token_batches: 2.2e-7
77
cache_read_input_token_cost: 2.5e-8
88
limits:
9-
max_tokens: 4096
9+
max_tokens: 32768
1010
max_input_tokens: 1047576
1111
max_output_tokens: 32768
12-
features: [function_calling, parallel_function_calling, vision, chat, image]
13-
params:
14-
- key: max_completion_tokens
15-
defaultValue: 1000
16-
minValue: 1
17-
maxValue: 32768
18-
- key: response_format
19-
defaultValue: null
20-
options:
21-
- value: null
22-
name: Text
23-
- value: json_object
24-
name: JSON Object
25-
schema:
26-
type: object
27-
properties:
28-
type:
29-
type: string
30-
value: json_object
31-
- value: json_schema
32-
name: JSON Schema
33-
schema:
34-
type: object
35-
properties:
36-
type:
37-
type: string
38-
value: json_schema
39-
json_schema:
40-
type: object
41-
params:
42-
key: json_schema
43-
defaultValue: null
44-
type: json
45-
skipValues:
46-
- null
47-
skipValues:
48-
- null
49-
type: string
50-
removeParams:
51-
- max_tokens
12+
features: [function_calling, parallel_function_calling, vision]
5213
mode: chat
14+
defaultRegion: us
5315
original_provider: azure
Lines changed: 6 additions & 47 deletions
Original file line number | Diff line number | Diff line change
@@ -1,54 +1,13 @@
11
model: gpt-4o-2024-08-06
22
costs:
3-
input_cost_per_token: 0.0000025
4-
output_cost_per_token: 0.00001
5-
cache_read_input_token_cost: 0.00000125
3+
input_cost_per_token: 0.00000275
4+
output_cost_per_token: 0.000011
5+
cache_read_input_token_cost: 0.000001375
66
limits:
7+
max_tokens: 16384
78
max_input_tokens: 128000
89
max_output_tokens: 16384
9-
features: [function_calling, parallel_function_calling, vision, chat, image]
10-
params:
11-
- key: max_tokens
12-
maxValue: 16384
13-
- key: response_format
14-
defaultValue: null
15-
options:
16-
- value: null
17-
name: Text
18-
- value: json_object
19-
name: JSON Object
20-
schema:
21-
type: object
22-
properties:
23-
type:
24-
type: string
25-
value: json_object
26-
- value: json_schema
27-
name: JSON Schema
28-
schema:
29-
type: object
30-
properties:
31-
type:
32-
type: string
33-
value: json_schema
34-
json_schema:
35-
type: object
36-
params:
37-
key: json_schema
38-
defaultValue: null
39-
type: json
40-
skipValues:
41-
- null
42-
skipValues:
43-
- null
44-
type: string
45-
- key: frequency_penalty
46-
defaultValue: 0
47-
minValue: -2
48-
maxValue: 2
49-
- key: presence_penalty
50-
defaultValue: 0
51-
minValue: -2
52-
maxValue: 2
10+
features: [function_calling, parallel_function_calling, vision]
5311
mode: chat
12+
defaultRegion: us
5413
original_provider: azure

providers/azure-openai/gpt-4o-2024-11-20.yaml

Lines changed: 4 additions & 29 deletions
Original file line number | Diff line number | Diff line change
@@ -2,37 +2,12 @@ model: gpt-4o-2024-11-20
22
costs:
33
input_cost_per_token: 0.00000275
44
output_cost_per_token: 0.000011
5-
cache_read_input_token_cost: 0.00000125
5+
cache_creation_input_token_cost: 0.00000138
66
limits:
7+
max_tokens: 16384
78
max_input_tokens: 128000
89
max_output_tokens: 16384
9-
features: [function_calling, parallel_function_calling, vision, chat, image]
10-
params:
11-
- key: max_tokens
12-
maxValue: 16384
13-
- key: response_format
14-
defaultValue: null
15-
options:
16-
- value: null
17-
name: Text
18-
- value: json_object
19-
name: JSON Object
20-
schema:
21-
type: object
22-
properties:
23-
type:
24-
type: string
25-
value: json_object
26-
skipValues:
27-
- null
28-
type: string
29-
- key: frequency_penalty
30-
defaultValue: 0
31-
minValue: -2
32-
maxValue: 2
33-
- key: presence_penalty
34-
defaultValue: 0
35-
minValue: -2
36-
maxValue: 2
10+
features: [function_calling, parallel_function_calling, vision]
3711
mode: chat
12+
defaultRegion: us
3813
original_provider: azure

providers/azure-openai/gpt-4o-mini-2024-07-18.yaml

Lines changed: 4 additions & 45 deletions
Original file line number | Diff line number | Diff line change
@@ -2,53 +2,12 @@ model: gpt-4o-mini-2024-07-18
22
costs:
33
input_cost_per_token: 1.65e-7
44
output_cost_per_token: 6.6e-7
5-
cache_read_input_token_cost: 7.5e-8
5+
cache_read_input_token_cost: 8.3e-8
66
limits:
7+
max_tokens: 16384
78
max_input_tokens: 128000
89
max_output_tokens: 16384
9-
features: [function_calling, parallel_function_calling, vision, chat, image]
10-
params:
11-
- key: max_tokens
12-
maxValue: 16384
13-
- key: response_format
14-
defaultValue: null
15-
options:
16-
- value: null
17-
name: Text
18-
- value: json_object
19-
name: JSON Object
20-
schema:
21-
type: object
22-
properties:
23-
type:
24-
type: string
25-
value: json_object
26-
- value: json_schema
27-
name: JSON Schema
28-
schema:
29-
type: object
30-
properties:
31-
type:
32-
type: string
33-
value: json_schema
34-
json_schema:
35-
type: object
36-
params:
37-
key: json_schema
38-
defaultValue: null
39-
type: json
40-
skipValues:
41-
- null
42-
skipValues:
43-
- null
44-
type: string
45-
- key: frequency_penalty
46-
defaultValue: 0
47-
minValue: -2
48-
maxValue: 2
49-
- key: presence_penalty
50-
defaultValue: 0
51-
minValue: -2
52-
maxValue: 2
10+
features: [function_calling, parallel_function_calling, vision]
5311
mode: chat
12+
defaultRegion: us
5413
original_provider: azure

0 commit comments

Comments
 (0)