Update finetuning_args.py

Former-commit-id: b24635d22b
This commit is contained in:
Yuchen Han
2023-11-17 00:15:51 -08:00
committed by GitHub
parent 0d2262ffd0
commit ec910a87c0

View File

@@ -74,6 +74,10 @@ class RLHFArguments:
default=None,
metadata={"help": "Log with either 'wandb' or 'tensorboard' in PPO training."}
)
# Per its help text: number of optimisation epochs per batch of samples (default 4).
ppo_epochs: Optional[int] = field(
    metadata={"help": "Number of optimisation epochs per batch of samples"},
    default=4,
)
ppo_score_norm: Optional[bool] = field(
default=False,
metadata={"help": "Use score normalization in PPO training."}