Skip to content

Commit 9347270

Browse files
authored
Update model configs [2026-02-15T00:00:25.137Z] (#56)
1 parent 686e9f5 commit 9347270

26 files changed

Lines changed: 249 additions & 6 deletions
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: deepseek.v3.2
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 6.2e-7
5+
output_cost_per_token: 0.00000185
6+
limits:
7+
max_tokens: 163840
8+
max_input_tokens: 163840
9+
max_output_tokens: 163840
10+
features: [function_calling]
11+
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: eu.deepseek.v3.2
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 7.4e-7
5+
output_cost_per_token: 0.00000222
6+
limits:
7+
max_tokens: 163840
8+
max_input_tokens: 163840
9+
max_output_tokens: 163840
10+
features: [function_calling]
11+
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: minimax.minimax-m2.1
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 3.e-7
5+
output_cost_per_token: 0.0000012
6+
limits:
7+
max_tokens: 8192
8+
max_input_tokens: 196000
9+
max_output_tokens: 8192
10+
features: [function_calling]
11+
mode: chat
Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
11
model: moonshotai.kimi-k2.5
22
costs:
33
- region: '*'
4-
input_cost_per_token: 7.3e-7
5-
output_cost_per_token: 0.00000303
4+
input_cost_per_token: 6.e-7
5+
output_cost_per_token: 0.000003
66
limits:
77
max_tokens: 262144
88
max_input_tokens: 262144
99
max_output_tokens: 262144
10-
features: [function_calling]
10+
features: [function_calling, vision]
1111
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: nvidia.nemotron-nano-3-30b
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 6.e-8
5+
output_cost_per_token: 2.4e-7
6+
limits:
7+
max_tokens: 8192
8+
max_input_tokens: 262144
9+
max_output_tokens: 8192
10+
features: [function_calling]
11+
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: qwen.qwen3-coder-next
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 5.e-7
5+
output_cost_per_token: 0.0000012
6+
limits:
7+
max_tokens: 8192
8+
max_input_tokens: 262144
9+
max_output_tokens: 8192
10+
features: [function_calling]
11+
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: us.deepseek.v3.2
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 6.2e-7
5+
output_cost_per_token: 0.00000185
6+
limits:
7+
max_tokens: 163840
8+
max_input_tokens: 163840
9+
max_output_tokens: 163840
10+
features: [function_calling]
11+
mode: chat
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
model: zai.glm-4.7
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 6.e-7
5+
output_cost_per_token: 0.0000022
6+
limits:
7+
max_tokens: 128000
8+
max_input_tokens: 200000
9+
max_output_tokens: 128000
10+
features: [function_calling]
11+
mode: chat
Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
model: gemini-2.0-flash-lite-001
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 7.5e-8
5+
output_cost_per_token: 3.e-7
6+
cache_read_input_token_cost: 1.875e-8
7+
input_cost_per_audio_token: 7.5e-8
8+
limits:
9+
max_tokens: 4096
10+
max_input_tokens: 1048576
11+
max_output_tokens: 8192
12+
features: [function_calling, vision, audio_output, chat, image, pdf, doc]
13+
mode: chat
Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
1+
model: gemini-2.5-flash-native-audio-latest
2+
costs:
3+
- region: '*'
4+
input_cost_per_token: 3.e-7
5+
output_cost_per_token: 0.0000025
6+
input_cost_per_audio_token: 0.000001
7+
limits:
8+
max_tokens: 8192
9+
max_input_tokens: 1048576
10+
max_output_tokens: 8192
11+
features: [audio_input, audio_output]
12+
mode: chat

0 commit comments

Comments
 (0)