Skip to content

Commit 1634e15

Browse files
Reduction of the MINI profiler UT execution time (vllm-project#52)
* Adjust the UT parameters to reduce the total time of the MINI profiler test

  Signed-off-by: chzhang <chaojun.zhang@intel.com>

* Adjust the UT parameters to reduce the total time of the MINI profiler test

  Signed-off-by: chzhang <chaojun.zhang@intel.com>

* Adjust the UT parameters to reduce the total time of the MINI profiler test

  Signed-off-by: chzhang <chaojun.zhang@intel.com>

---------

Signed-off-by: chzhang <chaojun.zhang@intel.com>
1 parent 4085f86 commit 1634e15

6 files changed

Lines changed: 25 additions & 12 deletions

File tree

tests/fused_moe/test_fused_moe.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -30,9 +30,9 @@ def random_partition(size_a: int, target: int):
3030

3131
MINI_PYTEST_PARAMS = {
3232
"default": {
33-
"m,n,k": [(1, 256, 128), (4, 512, 256), (16, 512, 512)],
34-
"e": [16, 8],
35-
"topk": [1, 2],
33+
"m,n,k": [(1, 256, 128)],
34+
"e": [2],
35+
"topk": [1],
3636
"dtype": [torch.bfloat16]
3737
}
3838
}

tests/test_cache.py

Lines changed: 8 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -40,15 +40,19 @@
4040
MINI_PYTEST_PARAMS = {
4141
"default": {
4242
"num_tokens": [1],
43-
"head_size": [64, 80],
43+
"head_size": [8],
44+
"num_blocks": [4],
45+
"block_size": [8],
4446
},
4547
"test_concat_and_cache_mla": {
4648
"num_tokens": [1],
47-
"num_blocks": [32],
49+
"num_blocks": [4],
50+
"block_size": [8],
4851
},
4952
"test_gather_cache_mla": {
50-
"num_blocks": [32],
51-
"max_seq_len": [64],
53+
"num_blocks": [4],
54+
"block_size": [8],
55+
"max_seq_len": [4],
5256
},
5357
}
5458

tests/test_deepseek_scaling_rope.py

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,11 @@
1010
MINI_PYTEST_PARAMS = {
1111
"default": {
1212
"batch": [1],
13+
"seed": [123],
14+
"q_num_head,k_num_head": [(16, 1)],
15+
"rotary_dim": [64],
16+
"q_head_pad,k_head_pad": [(0, 0)],
17+
"is_neox": [True],
1318
},
1419
}
1520

tests/test_fp8_quant.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -132,8 +132,8 @@ def seed_everything(seed):
132132
#override pytest parameters when enable mini pytest
133133
MINI_PYTEST_PARAMS = {
134134
"default": {
135-
"num_tokens": [1, 7, 83],
136-
"hidden_size": [1, 2, 3, 4, 16],
135+
"num_tokens": [1],
136+
"hidden_size": [1],
137137
},
138138
}
139139

tests/test_grouped_topk.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,11 @@
99
#override pytest parameters when enable mini pytest
1010
MINI_PYTEST_PARAMS = {
1111
"default": {
12-
"n_hidden": [128, 256],
12+
"n_hidden": [4],
13+
"n_token": [1],
14+
"routed_scaling_factor": [1.0],
15+
"scoring_func": ["softmax"],
16+
"renormalize": [True],
1317
},
1418
}
1519

tests/test_rotary_embedding.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -34,9 +34,9 @@ def rotary_embedding_opcheck(rot,
3434
#override pytest parameters when enable mini pytest
3535
MINI_PYTEST_PARAMS = {
3636
"default": {
37-
"max_position": [11, 256],
37+
"max_position": [11],
3838
"head_size": [32],
39-
"seq_len": [11, 128],
39+
"seq_len": [11],
4040
},
4141
}
4242

0 commit comments

Comments
 (0)