Skip to content

Commit 90d18a6

Browse files
committed
Use same measuring approach
1 parent 63d8f2a commit 90d18a6

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

benchmarks/bench_trtllm_gen_mla.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -82,7 +82,7 @@ def bench_trtllm_mla(batch_size, q_len_per_request, seq_len, page_size, dtype):
82 82   bmm1_scale=1.0 / ((128 + 64) ** 0.5),
83 83   bmm2_scale=1.0,
84 84   )
85    - # benchmark using CUPTI
   85 + # benchmark
86 86   measurements = bench_gpu_time(
87 87   lambda: flashinfer.decode.trtllm_batch_decode_with_kv_cache_mla(
88 88   query=query,

0 commit comments

Comments
 (0)