We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3db5cf4 commit e2d9ab3Copy full SHA for e2d9ab3
1 file changed
tests/data/processors/test_unsupervised.py
@@ -30,17 +30,18 @@
30
31
TRAIN_ARGS = {
32
"model_name_or_path": TINY_LLAMA,
33
- "stage": "sft",
34
- "do_predict": True,
+ "stage": "ppo",
+ "do_train": True,
35
"finetuning_type": "full",
36
- "eval_dataset": "system_chat",
+ "reward_model": "",
37
+ "reward_model_type": "full",
38
+ "dataset": "system_chat",
39
"dataset_dir": "REMOTE:" + DEMO_DATA,
40
"template": "llama3",
41
"cutoff_len": 8192,
42
"overwrite_cache": True,
43
"output_dir": "dummy_dir",
44
"overwrite_output_dir": True,
- "predict_with_generate": True,
45
"fp16": True,
46
}
47
0 commit comments