mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-08-04 12:42:51 +08:00
parent
772a1b16a1
commit
ca6a3bc76f
@@ -42,7 +42,8 @@ def run_ppo(
         ppo_epochs=1,
         max_grad_norm=training_args.max_grad_norm,
         seed=training_args.seed,
-        optimize_cuda_cache=True
+        optimize_cuda_cache=True,
+        accelerator_kwargs={"step_scheduler_with_optimizer": False}
     )
 
     if finetuning_args.ppo_score_norm:
Loading…
x
Reference in New Issue
Block a user