mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-14 19:06:26 +08:00
Update project_kwargs for PPO config: pass training_args.logging_dir as logging_dir
This commit is contained in:
@@ -61,6 +61,7 @@ def run_ppo(
|
|||||||
use_score_norm=finetuning_args.ppo_score_norm,
|
use_score_norm=finetuning_args.ppo_score_norm,
|
||||||
whiten_rewards=finetuning_args.ppo_whiten_rewards,
|
whiten_rewards=finetuning_args.ppo_whiten_rewards,
|
||||||
accelerator_kwargs={"step_scheduler_with_optimizer": False},
|
accelerator_kwargs={"step_scheduler_with_optimizer": False},
|
||||||
|
project_kwargs={"logging_dir": training_args.logging_dir},
|
||||||
)
|
)
|
||||||
|
|
||||||
# Create optimizer and scheduler
|
# Create optimizer and scheduler
|
||||||
|
|||||||
Reference in New Issue
Block a user