support full-parameter PPO

Former-commit-id: ce78303600
This commit is contained in:
hiyouga
2023-11-16 02:08:04 +08:00
parent 0c1fab84f1
commit f441932bd1
20 changed files with 288 additions and 145 deletions

View File

@@ -51,7 +51,7 @@ def run_rm(
trainer.log_metrics("train", train_result.metrics)
trainer.save_metrics("train", train_result.metrics)
trainer.save_state()
- if trainer.is_world_process_zero() and model_args.plot_loss:
+ if trainer.is_world_process_zero() and finetuning_args.plot_loss:
plot_loss(training_args.output_dir, keys=["loss", "eval_loss"])
# Evaluation