release v0.2.2, fix #1478 #1466

This commit is contained in:
hiyouga
2023-11-13 23:09:05 +08:00
parent 87390ae3b7
commit 35cc1e28f6
3 changed files with 10 additions and 2 deletions

View File

@@ -136,7 +136,7 @@ class Runner:
args["upcast_layernorm"] = True
if args["stage"] == "ppo":
- args["reward_model"] = get("train.reward_model")
+ args["reward_model"] = get_save_dir(get("top.model_name"), get("top.finetuning_type"), get("train.reward_model"))
if args["stage"] == "dpo":
args["dpo_beta"] = get("train.dpo_beta")