Skip to content

Commit f279cbb

Browse files
Merge branch 'main' into bot/update-google-vertex-20260625-021011
2 parents 56656dc + 38ee990 commit f279cbb

36 files changed

Lines changed: 186 additions & 14 deletions

providers/aws-bedrock/amazon.rerank-v1:0.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,9 +22,12 @@ removeParams:
2222
- "n"
2323
- stop
2424
- stream
25+
- reasoning_effort
2526
sources:
2627
- https://docs.aws.amazon.com/bedrock/latest/userguide/rerank-supported.html
2728
- https://docs.aws.amazon.com/bedrock/latest/userguide/rerank.html
29+
- https://docs.aws.amazon.com/bedrock/latest/userguide/rerank-pricing.html
30+
- https://docs.aws.amazon.com/bedrock/latest/userguide/rerank-use.html
2831
status: active
2932
supportedModes:
3033
- rerank

providers/aws-bedrock/apac.amazon.nova-micro-v1:0.yaml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,8 @@ params:
5050
maxValue: 5000
5151
minValue: 1
5252
provisioning: serverless
53+
removeParams:
54+
- reasoning_effort
5355
sources:
5456
- https://docs.aws.amazon.com/nova/latest/userguide/what-is-nova.html
5557
- https://docs.aws.amazon.com/bedrock/latest/userguide/cross-region-inference-support.html

providers/aws-bedrock/au.anthropic.claude-sonnet-4-5-20250929-v1:0.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
costs:
22
- cache_creation_input_token_cost: 0.000004125
3+
cache_creation_input_token_cost_per_hour: 0.0000066
34
cache_read_input_token_cost: 3.3e-7
45
input_cost_per_token: 0.0000033
56
input_cost_per_token_batches: 0.00000165
@@ -21,6 +22,7 @@ costs:
2122
from: 200000
2223
pricing_mode: marginal
2324
- cache_creation_input_token_cost: 0.000004125
25+
cache_creation_input_token_cost_per_hour: 0.0000066
2426
cache_read_input_token_cost: 3.3e-7
2527
input_cost_per_token: 0.0000033
2628
input_cost_per_token_batches: 0.00000165
@@ -42,6 +44,7 @@ costs:
4244
from: 200000
4345
pricing_mode: marginal
4446
- cache_creation_input_token_cost: 0.000004125
47+
cache_creation_input_token_cost_per_hour: 0.0000066
4548
cache_read_input_token_cost: 3.3e-7
4649
input_cost_per_token: 0.0000033
4750
input_cost_per_token_batches: 0.00000165

providers/aws-bedrock/cohere.embed-english-v3.yaml

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,6 @@ limits:
3030
modalities:
3131
input:
3232
- text
33-
- image
3433
output:
3534
- embedding
3635
mode: embedding

providers/aws-bedrock/eu.amazon.nova-micro-v1:0.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -59,11 +59,11 @@ params:
5959
maxValue: 5000
6060
minValue: 1
6161
provisioning: serverless
62+
removeParams:
63+
- reasoning_effort
6264
sources:
6365
- https://docs.aws.amazon.com/nova/latest/userguide/what-is-nova.html
6466
- https://docs.aws.amazon.com/bedrock/latest/userguide/cross-region-inference-support.html
65-
- https://docs.aws.amazon.com/bedrock/latest/userguide/conversation-inference-supported-models-features.html
66-
- https://docs.aws.amazon.com/bedrock/latest/userguide/prompt-caching.html
6767
- https://docs.aws.amazon.com/bedrock/latest/userguide/model-card-amazon-nova-micro.html
6868
status: active
6969
supportedModes:

providers/aws-bedrock/eu.anthropic.claude-sonnet-4-6.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,7 @@ limits:
7474
context_window: 1000000
7575
max_output_tokens: 64000
7676
max_tokens: 64000
77-
tool_use_system_prompt_tokens: 346
77+
tool_use_system_prompt_tokens: 497
7878
modalities:
7979
input:
8080
- text

providers/aws-bedrock/global.anthropic.claude-opus-4-8.yaml

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,14 @@ costs:
1515
output_cost_per_token: 2.5e-5
1616
output_cost_per_token_batches: 1.25e-5
1717
region: us-west-1
18+
- cache_creation_input_token_cost: 6.25e-6
19+
cache_creation_input_token_cost_per_hour: 1e-5
20+
cache_read_input_token_cost: 5e-7
21+
input_cost_per_token: 5e-6
22+
input_cost_per_token_batches: 2.5e-6
23+
output_cost_per_token: 2.5e-5
24+
output_cost_per_token_batches: 1.25e-5
25+
region: us-east-2
1826
- cache_creation_input_token_cost: 6.25e-6
1927
cache_creation_input_token_cost_per_hour: 1e-5
2028
cache_read_input_token_cost: 5e-7
@@ -39,6 +47,22 @@ costs:
3947
output_cost_per_token: 2.5e-5
4048
output_cost_per_token_batches: 1.25e-5
4149
region: mx-central-1
50+
- cache_creation_input_token_cost: 6.25e-6
51+
cache_creation_input_token_cost_per_hour: 1e-5
52+
cache_read_input_token_cost: 5e-7
53+
input_cost_per_token: 5e-6
54+
input_cost_per_token_batches: 2.5e-6
55+
output_cost_per_token: 2.5e-5
56+
output_cost_per_token_batches: 1.25e-5
57+
region: me-south-1
58+
- cache_creation_input_token_cost: 6.25e-6
59+
cache_creation_input_token_cost_per_hour: 1e-5
60+
cache_read_input_token_cost: 5e-7
61+
input_cost_per_token: 5e-6
62+
input_cost_per_token_batches: 2.5e-6
63+
output_cost_per_token: 2.5e-5
64+
output_cost_per_token_batches: 1.25e-5
65+
region: me-central-1
4266
- cache_creation_input_token_cost: 6.25e-6
4367
cache_creation_input_token_cost_per_hour: 1e-5
4468
cache_read_input_token_cost: 5e-7

providers/aws-bedrock/global.anthropic.claude-sonnet-4-5-20250929-v1:0.yaml

Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -439,6 +439,28 @@ costs:
439439
- cost_per_token: 0.0000225
440440
from: 200000
441441
pricing_mode: marginal
442+
- cache_creation_input_token_cost: 0.00000375
443+
cache_creation_input_token_cost_per_hour: 0.000006
444+
cache_read_input_token_cost: 3e-7
445+
input_cost_per_token: 0.000003
446+
input_cost_per_token_batches: 0.0000015
447+
output_cost_per_token: 0.000015
448+
output_cost_per_token_batches: 0.0000075
449+
region: ap-southeast-6
450+
tiered_pricing:
451+
cache_read:
452+
- cost_per_token: 6e-7
453+
from: 200000
454+
cache_write:
455+
- cost_per_token: 0.0000075
456+
from: 200000
457+
input:
458+
- cost_per_token: 0.000006
459+
from: 200000
460+
output:
461+
- cost_per_token: 0.0000225
462+
from: 200000
463+
pricing_mode: marginal
442464
- cache_creation_input_token_cost: 0.00000375
443465
cache_creation_input_token_cost_per_hour: 0.000006
444466
cache_read_input_token_cost: 3e-7

providers/aws-bedrock/google.gemma-3-27b-it.yaml

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,9 @@ costs:
2020
- input_cost_per_token: 2.7e-7
2121
output_cost_per_token: 4.5e-7
2222
region: eu-south-1
23+
- input_cost_per_token: 1.7e-7
24+
output_cost_per_token: 4.8e-7
25+
region: eu-central-1
2326
- input_cost_per_token: 2.369e-7
2427
output_cost_per_token: 3.914e-7
2528
region: ap-southeast-2
@@ -50,6 +53,8 @@ params:
5053
maxValue: 8192
5154
minValue: 1
5255
provisioning: serverless
56+
removeParams:
57+
- reasoning_effort
5358
sources:
5459
- https://docs.aws.amazon.com/bedrock/latest/userguide/model-card-google-gemma-3-27b-pt.html
5560
- https://ai.google.dev/gemma/docs/core

providers/aws-bedrock/luma.ray-v2:0.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ removeParams:
1818
- "n"
1919
- stop
2020
- stream
21+
- reasoning_effort
2122
sources:
2223
- https://lumalabs.ai/learning-hub
2324
- https://docs.aws.amazon.com/bedrock/latest/userguide/model-parameters-luma.html

0 commit comments

Comments
 (0)