From 6e64e02f714a3e51293585116783cd2f3a9ba28f Mon Sep 17 00:00:00 2001 From: hiyouga Date: Fri, 12 Jan 2024 00:27:57 +0800 Subject: [PATCH] fix #2164 Former-commit-id: abe23bb4aca4fa571ebafc329ec9a9d457e37d41 --- src/llmtuner/train/dpo/trainer.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/llmtuner/train/dpo/trainer.py b/src/llmtuner/train/dpo/trainer.py index 132df189..97d80353 100644 --- a/src/llmtuner/train/dpo/trainer.py +++ b/src/llmtuner/train/dpo/trainer.py @@ -36,6 +36,7 @@ class CustomDPOTrainer(DPOTrainer): self.precompute_ref_log_probs = False self._precomputed_train_ref_log_probs = False self._precomputed_eval_ref_log_probs = False + self._peft_has_been_casted_to_bf16 = False self.ref_model = ref_model self.beta = beta