44
44
run : bash scripts/amd_ci_install_dependency.sh
45
45
46
46
- name : Evaluate Accuracy
47
- timeout-minutes : 20
47
+ timeout-minutes : 30
48
48
run : |
49
49
bash scripts/amd_ci_exec.sh python3 test_eval_accuracy_large.py
50
50
bash scripts/amd_ci_exec.sh python3 test_eval_fp8_accuracy.py
70
70
run : bash scripts/amd_ci_install_dependency.sh
71
71
72
72
- name : Evaluate accuracy (TP=2)
73
- timeout-minutes : 20
73
+ timeout-minutes : 30
74
74
run : |
75
75
bash scripts/amd_ci_exec.sh python3 test_moe_eval_accuracy_large.py
76
76
94
94
run : bash scripts/amd_ci_install_dependency.sh
95
95
96
96
- name : MLA TEST
97
- timeout-minutes : 20
97
+ timeout-minutes : 30
98
98
run : |
99
99
bash scripts/amd_ci_exec.sh python3 test_mla.py
100
100
@@ -118,31 +118,26 @@ jobs:
118
118
run : bash scripts/amd_ci_install_dependency.sh
119
119
120
120
- name : Benchmark single latency
121
- timeout-minutes : 10
121
+ timeout-minutes : 20
122
122
run : |
123
123
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_small
124
124
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_default
125
125
126
126
- name : Benchmark online latency
127
- timeout-minutes : 10
127
+ timeout-minutes : 15
128
128
run : |
129
129
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_online_latency_default
130
130
131
131
- name : Benchmark offline throughput
132
- timeout-minutes : 10
132
+ timeout-minutes : 15
133
133
run : |
134
134
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default
135
135
136
136
- name : Benchmark offline throughput (Non-streaming, small batch size)
137
- timeout-minutes : 10
137
+ timeout-minutes : 15
138
138
run : |
139
139
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_non_stream_small_batch_size
140
140
141
- - name : Benchmark online latency (EAGLE)
142
- timeout-minutes : 10
143
- run : |
144
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_online_latency_eagle
145
-
146
141
performance-test-1-gpu-part-2-amd :
147
142
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
148
143
github.event.pull_request.draft == false
@@ -163,17 +158,17 @@ jobs:
163
158
run : bash scripts/amd_ci_install_dependency.sh
164
159
165
160
- name : Benchmark offline throughput (w/o RadixAttention)
166
- timeout-minutes : 10
161
+ timeout-minutes : 15
167
162
run : |
168
163
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_without_radix_cache
169
164
170
165
- name : Benchmark offline throughput (w/ Triton)
171
- timeout-minutes : 10
166
+ timeout-minutes : 15
172
167
run : |
173
168
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_with_triton_attention_backend
174
169
175
170
- name : Benchmark offline throughput (w/ FP8)
176
- timeout-minutes : 10
171
+ timeout-minutes : 15
177
172
run : |
178
173
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default_fp8
179
174
@@ -197,27 +192,27 @@ jobs:
197
192
run : bash scripts/amd_ci_install_dependency.sh
198
193
199
194
- name : Benchmark dummy grok (TP=2)
200
- timeout-minutes : 20
195
+ timeout-minutes : 30
201
196
run : |
202
197
bash scripts/amd_ci_exec.sh python3 models/test_dummy_grok_models.py
203
198
204
199
- name : Benchmark single latency (TP=2)
205
- timeout-minutes : 20
200
+ timeout-minutes : 25
206
201
run : |
207
202
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
208
203
209
204
- name : Benchmark single latency + torch.compile (TP=2)
210
- timeout-minutes : 20
205
+ timeout-minutes : 25
211
206
run : |
212
207
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_torch_compile_tp2_bs1
213
208
214
209
- name : Benchmark offline throughput (TP=2)
215
- timeout-minutes : 20
210
+ timeout-minutes : 25
216
211
run : |
217
212
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_default
218
213
219
214
- name : Benchmark offline throughput (w/o RadixAttention) (TP=2)
220
- timeout-minutes : 20
215
+ timeout-minutes : 25
221
216
run : |
222
217
bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_without_radix_cache
223
218
@@ -241,7 +236,7 @@ jobs:
241
236
run : bash scripts/amd_ci_install_dependency.sh
242
237
243
238
- name : Run test
244
- timeout-minutes : 30
239
+ timeout-minutes : 40
245
240
run : |
246
241
bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-amd
247
242
@@ -265,7 +260,7 @@ jobs:
265
260
run : bash scripts/amd_ci_install_dependency.sh
266
261
267
262
- name : Run test
268
- timeout-minutes : 30
263
+ timeout-minutes : 40
269
264
run : |
270
265
bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-2-gpu-amd
271
266
@@ -274,7 +269,7 @@ jobs:
274
269
github.event.pull_request.draft == false
275
270
strategy :
276
271
matrix :
277
- runner : [linux-mi300-gpu-8, linux-mi325-gpu-8 ]
272
+ runner : [linux-mi300-gpu-8]
278
273
runs-on : ${{matrix.runner}}
279
274
steps :
280
275
- name : Checkout code
@@ -289,7 +284,7 @@ jobs:
289
284
run : bash scripts/amd_ci_install_dependency.sh
290
285
291
286
- name : Run test
292
- timeout-minutes : 30
287
+ timeout-minutes : 40
293
288
run : |
294
289
bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-8-gpu-amd
295
290
0 commit comments