This commit is contained in:
hiyouga
2024-07-03 02:31:50 +08:00
parent 71cdf8956e
commit 8b1172b910
3 changed files with 17 additions and 12 deletions

View File

@@ -54,7 +54,7 @@ def run_ppo(
reward_model = create_reward_model(model, model_args, finetuning_args)
# Initialize our Trainer
-ppo_trainer = CustomPPOTrainer(
+ppo_trainer: "CustomPPOTrainer" = CustomPPOTrainer(
model_args=model_args,
training_args=training_args,
finetuning_args=finetuning_args,