Skip to content

Commit 50a4132

Browse files
fix: drop load_format=dummy_dtensor; modern vLLM rejects it. Let the verl default win
1 parent 159e141 commit 50a4132

2 files changed

Lines changed: 9 additions & 3 deletions

File tree

configs/grpo_qwen1_5b.yaml

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,10 @@ data:
2424
tokenizer: null
2525
# Default: dataset built by `scripts/build_grpo_dataset.py`. Override per-run.
2626
train_files: results/grpo_dataset/v1/train.parquet
27-
val_files: null
27+
# verl tries to LOAD a val dataset even with test_freq: -1, so point at
28+
# the train parquet to keep it happy. Validation logic itself is disabled
29+
# via test_freq + val_before_train, so this dataset is never iterated.
30+
val_files: results/grpo_dataset/v1/train.parquet
2831
prompt_key: prompt
2932
max_prompt_length: 1024
3033
max_response_length: 1024
@@ -86,7 +89,9 @@ actor_rollout_ref:
8689
ignore_eos: false
8790
enforce_eager: false
8891
free_cache_engine: true
89-
load_format: dummy_dtensor
92+
# load_format inherited from ppo_trainer defaults (modern vLLM rejects the
93+
# old "dummy_dtensor" name). Let verl pick a compatible value for its
94+
# bundled vLLM version.
9095
tensor_model_parallel_size: 1
9196
max_num_batched_tokens: 8192
9297
max_num_seqs: 1024

configs/grpo_qwen7b.yaml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,8 @@ actor_rollout_ref:
7474
ignore_eos: false
7575
enforce_eager: false
7676
free_cache_engine: true
77-
load_format: dummy_dtensor
77+
# load_format inherited from ppo_trainer defaults (modern vLLM rejects
78+
# the old "dummy_dtensor" name).
7879
tensor_model_parallel_size: 2 # split rollout across 2 GPUs
7980
max_num_batched_tokens: 8192
8081
max_num_seqs: 512

0 commit comments

Comments
 (0)