Skip to content

Commit 4b6d929

Browse files
authored
[CI][Bugfix] Update environment variables for test configurations in Buildkite YAML files to resolve HF timeout (vllm-project#2628)
Signed-off-by: wangyu <410167048@qq.com>
1 parent 694be6f commit 4b6d929

4 files changed

Lines changed: 20 additions & 35 deletions

File tree

.buildkite/test-merge.yml

Lines changed: 5 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,8 @@
1+
env:
2+
VLLM_WORKER_MULTIPROC_METHOD: spawn
3+
HF_HUB_DOWNLOAD_TIMEOUT: 300
4+
HF_HUB_ETAG_TIMEOUT: 60
5+
16
steps:
27
- label: "Simple Unit Test"
38
depends_on: upload-merge-pipeline
@@ -169,7 +174,6 @@ steps:
169174
commands:
170175
- |
171176
timeout 15m bash -c '
172-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
173177
pytest -s -v tests/engine/test_async_omni_engine_abort.py
174178
'
175179
agents:
@@ -191,7 +195,6 @@ steps:
191195
depends_on: upload-merge-pipeline
192196
commands:
193197
- export VLLM_LOGGING_LEVEL=DEBUG
194-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
195198
- pytest -s -v tests/e2e/offline_inference/test_qwen2_5_omni.py tests/e2e/online_serving/test_qwen2_5_omni.py -m "advanced_model" --run-level "advanced_model"
196199
agents:
197200
queue: "gpu_4_queue" # g6.12xlarge instance on AWS, has 4 L4 GPU
@@ -212,7 +215,6 @@ steps:
212215
- |
213216
timeout 20m bash -c '
214217
export VLLM_LOGGING_LEVEL=DEBUG
215-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
216218
export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
217219
pytest -s -v tests/e2e/online_serving/test_qwen3_tts_customvoice.py tests/e2e/offline_inference/test_qwen3_tts_customvoice.py -m "advanced_model" --run-level "advanced_model"
218220
'
@@ -235,7 +237,6 @@ steps:
235237
- |
236238
timeout 20m bash -c '
237239
export VLLM_LOGGING_LEVEL=DEBUG
238-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
239240
export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
240241
pytest -s -v tests/e2e/online_serving/test_qwen3_tts_base.py tests/e2e/offline_inference/test_qwen3_tts_base.py -m "advanced_model" --run-level "advanced_model"
241242
'
@@ -256,7 +257,6 @@ steps:
256257
timeout_in_minutes: 30
257258
depends_on: upload-merge-pipeline
258259
commands:
259-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
260260
- export VLLM_TEST_CLEAN_GPU_MEMORY="1"
261261
- pytest -s -v tests/e2e/offline_inference/test_qwen3_omni.py tests/e2e/online_serving/test_qwen3_omni.py tests/e2e/online_serving/test_mimo_audio.py -m "advanced_model" --run-level "advanced_model"
262262
agents:
@@ -297,7 +297,6 @@ steps:
297297
timeout_in_minutes: 20
298298
depends_on: upload-merge-pipeline
299299
commands:
300-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
301300
- pytest -s -v tests/e2e/online_serving/test_image_gen_edit.py
302301
agents:
303302
queue: "mithril-h100-pool"
@@ -340,7 +339,6 @@ steps:
340339
- |
341340
timeout 55m bash -c '
342341
set -e
343-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
344342
export VLLM_TEST_CLEAN_GPU_MEMORY=1
345343
export VLLM_IMAGE_FETCH_TIMEOUT=60
346344
pytest -s -v tests/e2e/offline_inference/test_bagel_text2img.py -m "advanced_model" --run-level "advanced_model" -k "shared_memory"
@@ -387,7 +385,6 @@ steps:
387385
- |
388386
timeout 20m bash -c '
389387
export VLLM_LOGGING_LEVEL=DEBUG
390-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
391388
pytest -s -v tests/e2e/online_serving/test_voxtral_tts.py tests/e2e/offline_inference/test_voxtral_tts.py -m "advanced_model" --run-level "advanced_model"
392389
'
393390
agents:

.buildkite/test-nightly-diffusion.yml

Lines changed: 5 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -2,6 +2,11 @@
22
# buildkite-agent pipeline upload .buildkite/test-nightly-diffusion.yml
33
# from test-nightly.yml (step key: nightly-diffusion-model-test). Top-level groups are
44
# foldable in the Buildkite UI (Other / Wan / Qwen-Image).
5+
env:
6+
VLLM_WORKER_MULTIPROC_METHOD: spawn
7+
HF_HUB_DOWNLOAD_TIMEOUT: 300
8+
HF_HUB_ETAG_TIMEOUT: 60
9+
510
steps:
611
- group: ":card_index_dividers: Other Model Test"
712
key: nightly-other-model-test-group
@@ -10,7 +15,6 @@ steps:
1015
timeout_in_minutes: 120
1116
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
1217
commands:
13-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
1418
- pytest -s -v tests/e2e/online_serving/test_*_expansion.py -k "not test_wan22_expansion and not test_wan_2_1_vace_expansion and not test_qwen_image" -m "advanced_model and diffusion and H100" --run-level "advanced_model"
1519
agents:
1620
queue: "mithril-h100-pool"
@@ -50,7 +54,6 @@ steps:
5054
timeout_in_minutes: 60
5155
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
5256
commands:
53-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
5457
- pytest -s -v tests/e2e/online_serving/test_*_expansion.py -m "advanced_model and diffusion and L4" --run-level "advanced_model"
5558
agents:
5659
queue: "gpu_4_queue" # g6.12xlarge instance on AWS, has 4 L4 GPU
@@ -70,7 +73,6 @@ steps:
7073
timeout_in_minutes: 60
7174
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
7275
commands:
73-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
7476
- export VLLM_TEST_CLEAN_GPU_MEMORY="1"
7577
- pytest -s -v tests/examples/online_serving/test_text_to_image.py tests/examples/offline_inference/test_text_to_image.py -m "advanced_model and example and H100" --run-level "advanced_model"
7678
agents:
@@ -114,7 +116,6 @@ steps:
114116
timeout_in_minutes: 90
115117
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
116118
commands:
117-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
118119
- pytest -s -v tests/e2e/online_serving/test_wan22_expansion.py tests/e2e/online_serving/test_wan_2_1_vace_expansion.py -m "advanced_model" --run-level "advanced_model"
119120
agents:
120121
queue: "mithril-h100-pool"
@@ -155,7 +156,6 @@ steps:
155156
timeout_in_minutes: 180
156157
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
157158
commands:
158-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
159159
- pytest -s -v tests/e2e/accuracy/wan22_i2v/test_wan22_i2v_video_similarity.py --run-level advanced_model
160160
agents:
161161
queue: "mithril-h100-pool"
@@ -198,7 +198,6 @@ steps:
198198
timeout_in_minutes: 120
199199
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
200200
commands:
201-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
202201
- pytest -s -v tests/e2e/online_serving/test_qwen_image*_expansion.py -m "advanced_model and diffusion and H100" --run-level "advanced_model"
203202
agents:
204203
queue: "mithril-h100-pool"
@@ -239,7 +238,6 @@ steps:
239238
timeout_in_minutes: 60
240239
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
241240
commands:
242-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
243241
- pytest -s -v tests/e2e/accuracy/test_gebench_h100_smoke.py --run-level advanced_model --gebench-model Qwen/Qwen-Image-2512 --accuracy-judge-model QuantTrio/Qwen3-VL-30B-A3B-Instruct-AWQ --accuracy-gpu 0 --gebench-port 8093 --accuracy-workers 1
244242
- buildkite-agent artifact upload "tests/e2e/accuracy/artifacts/gebench_qwen-image-2512/summary*.json"
245243
agents:
@@ -281,7 +279,6 @@ steps:
281279
timeout_in_minutes: 60
282280
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
283281
commands:
284-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
285282
- pytest -s -v tests/e2e/accuracy/test_gedit_bench_h100_smoke.py --run-level advanced_model --gedit-model Qwen/Qwen-Image-Edit --accuracy-judge-model QuantTrio/Qwen3-VL-30B-A3B-Instruct-AWQ --accuracy-gpu 0 --gedit-port 8093 --gedit-samples-per-group 20 --accuracy-workers 1
286283
- buildkite-agent artifact upload "tests/e2e/accuracy/artifacts/gedit_scores_qwen-image-edit/qwen-image-edit_all_all_vie_score_*.csv"
287284
- buildkite-agent artifact upload "tests/e2e/accuracy/artifacts/gedit_scores_qwen-image-edit/qwen-image-edit_all_all_summary_*.json"
@@ -326,7 +323,6 @@ steps:
326323
timeout_in_minutes: 180
327324
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
328325
commands:
329-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
330326
- export DIFFUSION_BENCHMARK_DIR=tests/dfx/perf/results
331327
- export CACHE_DIT_VERSION=1.3.0
332328
- pytest -s -v tests/dfx/perf/scripts/run_diffusion_benchmark.py --config-file tests/dfx/perf/tests/test_qwen_image_vllm_omni.json

.buildkite/test-nightly.yml

Lines changed: 5 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,8 @@
1+
env:
2+
VLLM_WORKER_MULTIPROC_METHOD: spawn
3+
HF_HUB_DOWNLOAD_TIMEOUT: 300
4+
HF_HUB_ETAG_TIMEOUT: 60
5+
16
steps:
27
# Group: collapses under one heading in the Buildkite UI; child steps still run in parallel.
38
- group: ":card_index_dividers: Omni Model Test"
@@ -8,7 +13,6 @@ steps:
813
depends_on: upload-nightly-pipeline
914
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
1015
commands:
11-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
1216
- pytest -s -v tests/e2e/online_serving/test_*_expansion.py -m "advanced_model and H100 and omni" --run-level "advanced_model"
1317
agents:
1418
queue: "mithril-h100-pool"
@@ -49,7 +53,6 @@ steps:
4953
depends_on: upload-nightly-pipeline
5054
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
5155
commands:
52-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
5356
- export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
5457
- pytest -s -v tests/e2e/online_serving/test_*_expansion.py -m "advanced_model and L4 and omni" --run-level "advanced_model"
5558
agents:
@@ -71,7 +74,6 @@ steps:
7174
depends_on: upload-nightly-pipeline
7275
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
7376
commands:
74-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
7577
- export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
7678
- pytest -s -v tests/examples/ -m "advanced_model and omni and L4" --run-level "advanced_model"
7779
agents:
@@ -93,7 +95,6 @@ steps:
9395
depends_on: upload-nightly-pipeline
9496
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
9597
commands:
96-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
9798
- pytest -s -v tests/examples/ -m "advanced_model and omni and H100" --run-level "advanced_model"
9899
agents:
99100
queue: "mithril-h100-pool"
@@ -135,7 +136,6 @@ steps:
135136
depends_on: upload-nightly-pipeline
136137
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
137138
commands:
138-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
139139
- export BENCHMARK_DIR=tests/dfx/perf/results
140140
- export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
141141
- pytest -s -v tests/dfx/perf/scripts/run_benchmark.py
@@ -193,7 +193,6 @@ steps:
193193
depends_on: upload-nightly-pipeline
194194
if: build.env("NIGHTLY") == "1" || build.pull_request.labels includes "nightly-test"
195195
commands:
196-
- export VLLM_WORKER_MULTIPROC_METHOD=spawn
197196
- python tools/nightly/buildkite_testcase_statistics.py -o tests/dfx/perf/results/buildkite_testcase_statistics.html
198197
- buildkite-agent artifact upload "tests/dfx/perf/results/*.html"
199198
agents:

.buildkite/test-ready.yml

Lines changed: 5 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,8 @@
1+
env:
2+
VLLM_WORKER_MULTIPROC_METHOD: spawn
3+
HF_HUB_DOWNLOAD_TIMEOUT: 300
4+
HF_HUB_ETAG_TIMEOUT: 60
5+
16
steps:
27
- label: "Simple Unit Test"
38
depends_on: upload-ready-pipeline
@@ -173,7 +178,6 @@ steps:
173178
commands:
174179
- |
175180
timeout 15m bash -c '
176-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
177181
pytest -s -v tests/engine/test_async_omni_engine_abort.py
178182
'
179183
agents:
@@ -197,7 +201,6 @@ steps:
197201
- |
198202
timeout 17m bash -c '
199203
export VLLM_LOGGING_LEVEL=DEBUG
200-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
201204
pytest -s -v tests/e2e/online_serving/test_qwen2_5_omni.py -m "core_model" --run-level "core_model"
202205
'
203206
agents:
@@ -218,7 +221,6 @@ steps:
218221
commands:
219222
- |
220223
timeout 20m bash -c '
221-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
222224
pytest -s -v tests/e2e/online_serving/test_qwen3_omni.py -m "core_model" --run-level "core_model"
223225
'
224226
agents:
@@ -256,7 +258,6 @@ steps:
256258
- |
257259
timeout 30m bash -c '
258260
export VLLM_LOGGING_LEVEL=DEBUG
259-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
260261
pytest -s -v tests/e2e/online_serving/test_mimo_audio.py -m "core_model" --run-level "core_model"
261262
'
262263
agents:
@@ -299,7 +300,6 @@ steps:
299300
- |
300301
timeout 20m bash -c '
301302
export VLLM_LOGGING_LEVEL=DEBUG
302-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
303303
export VLLM_ALLOW_LONG_MAX_MODEL_LEN="1"
304304
pytest -s -v tests/e2e/online_serving/test_qwen3_tts_customvoice.py -m "core_model" --run-level "core_model"
305305
'
@@ -324,7 +324,6 @@ steps:
324324
- |
325325
timeout 20m bash -c '
326326
export VLLM_LOGGING_LEVEL=DEBUG
327-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
328327
pytest -s -v tests/e2e/online_serving/test_omnivoice.py -m "core_model" --run-level "core_model"
329328
'
330329
agents:
@@ -347,7 +346,6 @@ steps:
347346
- |
348347
timeout 20m bash -c '
349348
export VLLM_LOGGING_LEVEL=DEBUG
350-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
351349
pytest -s -v tests/e2e/online_serving/test_voxtral_tts.py -m "core_model" --run-level "core_model"
352350
'
353351
agents:
@@ -384,7 +382,6 @@ steps:
384382
# commands:
385383
# - |
386384
# timeout 20m bash -c '
387-
# export VLLM_WORKER_MULTIPROC_METHOD=spawn
388385
# pytest -s -v tests/e2e/online_serving/test_image_gen_edit.py
389386
# '
390387
# agents:
@@ -421,7 +418,6 @@ steps:
421418
commands:
422419
- |
423420
timeout 30m bash -c '
424-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
425421
export VLLM_TEST_CLEAN_GPU_MEMORY=1
426422
pytest -s -v tests/e2e/offline_inference/test_bagel_text2img.py -m "core_model" --run-level "core_model"
427423
'
@@ -464,7 +460,6 @@ steps:
464460
commands:
465461
- |
466462
timeout 30m bash -c '
467-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
468463
export VLLM_TEST_CLEAN_GPU_MEMORY=1
469464
pytest -s -v tests/e2e/offline_inference/test_bagel_img2img.py -m "core_model" --run-level "core_model"
470465
'
@@ -507,7 +502,6 @@ steps:
507502
commands:
508503
- |
509504
timeout 40m bash -c '
510-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
511505
export VLLM_TEST_CLEAN_GPU_MEMORY=1
512506
export VLLM_IMAGE_FETCH_TIMEOUT=60
513507
pytest -s -v tests/e2e/online_serving/test_bagel_online.py -m "core_model" --run-level "core_model"
@@ -552,7 +546,6 @@ steps:
552546
commands:
553547
- |
554548
timeout 20m bash -c '
555-
export VLLM_WORKER_MULTIPROC_METHOD=spawn
556549
pytest -s -v tests/e2e/online_serving/test_cosyvoice3_tts.py -m "core_model" --run-level "core_model"
557550
'
558551
agents:

0 commit comments

Comments (0)