Former-commit-id: e86f20134b782c8f5c39ead292f8f7582038eb9e
This commit is contained in:
hiyouga 2024-07-19 01:17:37 +08:00
parent 3db5cf44ea
commit e2d9ab3591

View File

@@ -30,17 +30,18 @@ TINY_DATA = os.environ.get("TINY_DATA", "llamafactory/tiny-supervised-dataset")
# Argument dictionary for a PPO-stage run on the tiny test model.
# NOTE(review): presumably consumed by the project's argument parser in the
# tests of this file -- confirm against the callers, which are not visible here.
TRAIN_ARGS = {
    "model_name_or_path": TINY_LLAMA,
    # "stage" used to be listed twice ("sft", then "ppo"). In a dict display the
    # last value given for a repeated key wins, so only "ppo" ever took effect.
    # The dead "sft" entry is removed; the key keeps its original position so
    # the resulting dict (content and insertion order) is unchanged.
    "stage": "ppo",
    # NOTE(review): do_predict / eval_dataset / predict_with_generate sit next
    # to do_train / dataset / reward_model*. They look like pre-change leftovers
    # from an interleaved diff, but unlike the duplicate "stage" they do change
    # the dict, so they are kept as-is -- confirm whether they should be dropped.
    "do_predict": True,
    "do_train": True,
    "finetuning_type": "full",
    "eval_dataset": "system_chat",
    # Empty reward-model path. NOTE(review): presumably a placeholder because
    # the tests never load a reward model -- verify.
    "reward_model": "",
    "reward_model_type": "full",
    "dataset": "system_chat",
    "dataset_dir": "REMOTE:" + DEMO_DATA,
    "template": "llama3",
    "cutoff_len": 8192,
    "overwrite_cache": True,
    "output_dir": "dummy_dir",
    "overwrite_output_dir": True,
    "predict_with_generate": True,
    "fp16": True,
}