mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-14 19:06:26 +08:00
fix #809
This commit is contained in:
@@ -42,7 +42,7 @@ class DPOPeftTrainer(PeftModelMixin, DPOTrainer):
|
|||||||
|
|
||||||
if ref_model is not None:
|
if ref_model is not None:
|
||||||
if self.is_deepspeed_enabled:
|
if self.is_deepspeed_enabled:
|
||||||
self.ref_model = self.accelerator._prepare_deepspeed(self.ref_model)
|
self.ref_model, = self.accelerator._prepare_deepspeed(self.ref_model)
|
||||||
self.ref_model.eval()
|
self.ref_model.eval()
|
||||||
else:
|
else:
|
||||||
self.ref_model = self.accelerator.prepare_model(self.ref_model, evaluation_mode=True)
|
self.ref_model = self.accelerator.prepare_model(self.ref_model, evaluation_mode=True)
|
||||||
|
|||||||
Reference in New Issue
Block a user