Skip to content

Commit 1634cdd

Browse files
committed
update tests
1 parent 20c02d3 commit 1634cdd

File tree

1 file changed

+15
-1
lines changed

1 file changed

+15
-1
lines changed

onnxruntime/test/testdata/onnx_backend_test_series_filters.jsonc

Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@
4141
"^test_attention_4d_with_past_and_present_qk_matmul_bias_4d_mask_causal*", // location of infinities
4242
"^test_attention_4d_attn_mask_3d_causal_expanded*", // webgpu
4343
"^test_attention_4d_diff_heads_mask4d_padded_kv*", // Need nonpad_kv_seqlen
44-
// TODO: support the following tests in Attention-cuda
44+
// TODO: support the following tests in Attention-cuda (softcap, softmax precision and qk_matmul_mode)
4545
"^test_attention_3d_diff_heads_sizes_softcap_cuda", // softcap not supported in Attention-cuda
4646
"^test_attention_4d_diff_heads_sizes_softcap_cuda", // softcap not supported in Attention-cuda
4747
"^test_attention_3d_softcap_cuda", // softcap not supported in Attention-cuda
@@ -66,6 +66,20 @@
6666
"^test_attention_4d_attn_mask_4d_causal_cuda",
6767
"^test_attention_4d_causal_cuda",
6868
"^test_attention_4d_diff_heads_sizes_causal_cuda",
69+
// GQA Attention-cuda does not support fp32 or 4d QKV
70+
"^test_attention_4d_gqa_with_past_and_present_fp16_cuda", // 4d QKV
71+
"^test_attention_4d_gqa_with_past_and_present_cuda", // fp32
72+
"^test_attention_4d_gqa_softcap_cuda", // fp32
73+
"^test_attention_4d_gqa_scaled_cuda", // fp32
74+
"^test_attention_4d_gqa_cuda", // fp32
75+
"^test_attention_3d_gqa_attn_mask_cuda", // fp32
76+
"^test_attention_3d_gqa_causal_cuda", // fp32
77+
"^test_attention_3d_gqa_cuda", // fp32
78+
"^test_attention_3d_gqa_scaled_cuda", // fp32
79+
"^test_attention_3d_gqa_softcap_cuda", // fp32
80+
"^test_attention_3d_gqa_with_past_and_present_cuda", // fp32
81+
"^test_attention_4d_gqa_attn_mask_cuda", // fp32
82+
"^test_attention_4d_gqa_causal_cuda", // fp32
6983
"^test_tensorscatter*", // TensorScatter(24) not implemented
7084
"^test_castlike_no_saturate_FLOAT_to_FLOAT8*", // ORT does not support ml_dtypes
7185
"^test_castlike_UINT4_to*", // ORT does not support ml_dtypes

0 commit comments

Comments
 (0)