Skip to content

Commit ad6629a

Browse files
models-bot[bot] and Truefoundry Models Bot authored
feat(google-vertex): update model YAMLs [bot] (#1298)
Co-authored-by: Truefoundry Models Bot <truefoundry-models-bot@users.noreply.github.com>
1 parent c8aa264 commit ad6629a

1 file changed

Lines changed: 8 additions & 5 deletions

File tree

providers/google-vertex/google/gemini-3.1-flash-lite.yaml

Lines changed: 8 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -1,19 +1,22 @@
11
costs:
2-
- cache_read_input_token_cost: 2.75e-8
2+
- cache_read_input_audio_token_cost: 5.5e-8
3+
cache_read_input_token_cost: 2.75e-8
34
input_cost_per_audio_token: 5.5e-7
45
input_cost_per_token: 2.75e-7
56
input_cost_per_token_batches: 1.375e-7
67
output_cost_per_token: 0.00000165
78
output_cost_per_token_batches: 8.25e-7
89
region: us
9-
- cache_read_input_token_cost: 2.5e-8
10+
- cache_read_input_audio_token_cost: 5e-8
11+
cache_read_input_token_cost: 2.5e-8
1012
input_cost_per_audio_token: 5e-7
1113
input_cost_per_token: 2.5e-7
1214
input_cost_per_token_batches: 1.25e-7
1315
output_cost_per_token: 0.0000015
1416
output_cost_per_token_batches: 7.5e-7
1517
region: global
16-
- cache_read_input_token_cost: 2.75e-8
18+
- cache_read_input_audio_token_cost: 5.5e-8
19+
cache_read_input_token_cost: 2.75e-8
1720
input_cost_per_audio_token: 5.5e-7
1821
input_cost_per_token: 2.75e-7
1922
input_cost_per_token_batches: 1.375e-7
@@ -48,8 +51,8 @@ model: google/gemini-3.1-flash-lite
4851
provisioning: serverless
4952
sources:
5053
- https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models/gemini/3-1-flash-lite
51-
- https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite-preview
52-
status: preview
54+
- https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite
55+
status: active
5356
supportedModes:
5457
- chat
5558
thinking: true

0 commit comments

Comments
 (0)