|
1 | 1 | costs: |
2 | | - - cache_read_input_token_cost: 2.75e-8 |
| 2 | + - cache_read_input_audio_token_cost: 5.5e-8 |
| 3 | + cache_read_input_token_cost: 2.75e-8 |
3 | 4 | input_cost_per_audio_token: 5.5e-7 |
4 | 5 | input_cost_per_token: 2.75e-7 |
5 | 6 | input_cost_per_token_batches: 1.375e-7 |
6 | 7 | output_cost_per_token: 0.00000165 |
7 | 8 | output_cost_per_token_batches: 8.25e-7 |
8 | 9 | region: us |
9 | | - - cache_read_input_token_cost: 2.5e-8 |
| 10 | + - cache_read_input_audio_token_cost: 5e-8 |
| 11 | + cache_read_input_token_cost: 2.5e-8 |
10 | 12 | input_cost_per_audio_token: 5e-7 |
11 | 13 | input_cost_per_token: 2.5e-7 |
12 | 14 | input_cost_per_token_batches: 1.25e-7 |
13 | 15 | output_cost_per_token: 0.0000015 |
14 | 16 | output_cost_per_token_batches: 7.5e-7 |
15 | 17 | region: global |
16 | | - - cache_read_input_token_cost: 2.75e-8 |
| 18 | + - cache_read_input_audio_token_cost: 5.5e-8 |
| 19 | + cache_read_input_token_cost: 2.75e-8 |
17 | 20 | input_cost_per_audio_token: 5.5e-7 |
18 | 21 | input_cost_per_token: 2.75e-7 |
19 | 22 | input_cost_per_token_batches: 1.375e-7 |
@@ -48,8 +51,8 @@ model: google/gemini-3.1-flash-lite |
48 | 51 | provisioning: serverless |
49 | 52 | sources: |
50 | 53 | - https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models/gemini/3-1-flash-lite |
51 | | - - https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite-preview |
52 | | -status: preview |
| 54 | + - https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite |
| 55 | +status: active |
53 | 56 | supportedModes: |
54 | 57 | - chat |
55 | 58 | thinking: true |
0 commit comments