Former-commit-id: cdb0f34f10f5407e83766a8c5c9c5aff6af2a84e
This commit is contained in:
hiyouga 2024-07-19 01:17:37 +08:00
parent d0891f05fa
commit 488f392c81

View File

@@ -30,17 +30,18 @@ TINY_DATA = os.environ.get("TINY_DATA", "llamafactory/tiny-supervised-dataset")
# Argument mapping for a run against the tiny model referenced by TINY_LLAMA.
# Presumably handed to the project's argument parser by the tests in this
# file -- confirm at the call site, which is outside this view.
#
# NOTE(review): this literal appears inside a diff hunk whose +/- markers are
# missing, so it presumably interleaves entries removed by the commit with
# entries added by it. Confirm against the committed file before relying on
# any individual key.
TRAIN_ARGS = {
"model_name_or_path": TINY_LLAMA,
# NOTE(review): "stage" is listed twice in this literal. Python keeps the last
# value for a repeated key, so this "sft" entry is overridden by "ppo" below.
"stage": "sft",
# NOTE(review): both "do_predict" and "do_train" are set to True here; likely
# one of them is the removed side of the diff -- TODO confirm.
"do_predict": True,
"stage": "ppo",
"do_train": True,
"finetuning_type": "full",
# NOTE(review): "eval_dataset" and "dataset" both name "system_chat"; likely an
# old/new pair from the diff -- TODO confirm.
"eval_dataset": "system_chat",
# Empty string is given as the reward model value; its meaning to the consumer
# is not visible from here.
"reward_model": "",
"reward_model_type": "full",
"dataset": "system_chat",
# DEMO_DATA is defined outside this view; the value is the literal prefix
# "REMOTE:" concatenated with it.
"dataset_dir": "REMOTE:" + DEMO_DATA,
"template": "llama3",
"cutoff_len": 8192,
"overwrite_cache": True,
"output_dir": "dummy_dir",
"overwrite_output_dir": True,
"predict_with_generate": True,
"fp16": True,
}