File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 2424 tokenizer : null
2525 # Default: dataset built by `scripts/build_grpo_dataset.py`. Override per-run.
2626 train_files : results/grpo_dataset/v1/train.parquet
27- val_files : null
27+ # verl still loads a validation dataset even with test_freq: -1, so point
28+ # val_files at the train parquet to satisfy the loader. Validation itself is
29+ # disabled via test_freq and val_before_train, so this data is never iterated.
30+ val_files : results/grpo_dataset/v1/train.parquet
2831 prompt_key : prompt
2932 max_prompt_length : 1024
3033 max_response_length : 1024
@@ -86,7 +89,9 @@ actor_rollout_ref:
8689 ignore_eos : false
8790 enforce_eager : false
8891 free_cache_engine : true
89- load_format : dummy_dtensor
92+ # load_format is intentionally unset here so it is inherited from the
93+ # ppo_trainer defaults (modern vLLM rejects the old "dummy_dtensor" name);
94+ # this lets verl pick a value compatible with its bundled vLLM version.
9095 tensor_model_parallel_size : 1
9196 max_num_batched_tokens : 8192
9297 max_num_seqs : 1024
Original file line number Diff line number Diff line change @@ -74,7 +74,8 @@ actor_rollout_ref:
7474 ignore_eos : false
7575 enforce_eager : false
7676 free_cache_engine : true
77- load_format : dummy_dtensor
77+ # load_format is intentionally unset here so it is inherited from the
78+ # ppo_trainer defaults (modern vLLM rejects the old "dummy_dtensor" name).
7879 tensor_model_parallel_size : 2 # split rollout across 2 GPUs
7980 max_num_batched_tokens : 8192
8081 max_num_seqs : 512
You can’t perform that action at this time.
0 commit comments