mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-10-16 16:48:11 +08:00
parent
f95f6ec009
commit
6e64e02f71
@ -36,6 +36,7 @@ class CustomDPOTrainer(DPOTrainer):
|
|||||||
self.precompute_ref_log_probs = False
|
self.precompute_ref_log_probs = False
|
||||||
self._precomputed_train_ref_log_probs = False
|
self._precomputed_train_ref_log_probs = False
|
||||||
self._precomputed_eval_ref_log_probs = False
|
self._precomputed_eval_ref_log_probs = False
|
||||||
|
self._peft_has_been_casted_to_bf16 = False
|
||||||
|
|
||||||
self.ref_model = ref_model
|
self.ref_model = ref_model
|
||||||
self.beta = beta
|
self.beta = beta
|
||||||
|
Loading…
x
Reference in New Issue
Block a user