Update PPO trainer

2025-12-16 20:00:36 +08:00 · 2023-08-02 18:46:41 +08:00
parent 286f7be346
commit b5ba87952a
2 changed files with 46 additions and 44 deletions
--- a/src/llmtuner/tuner/core/trainer.py
+++ b/src/llmtuner/tuner/core/trainer.py
@@ -47,7 +47,6 @@ class PeftTrainer(Seq2SeqTrainer):
        logger.info(f"Saving model checkpoint to {output_dir}")

        model = unwrap_model(self.model)
-
        if isinstance(model, PreTrainedModelWrapper):
            # Custom state dict: https://github.com/lvwerra/trl/blob/v0.4.7/trl/models/modeling_value_head.py#L200
            model_state_dict = state_dict or model.state_dict()