mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-11-06 02:42:15 +08:00
parent
518d9c4d8c
commit
970031b25c
@ -54,6 +54,7 @@ class CustomDPOTrainer(DPOTrainer):
|
||||
disable_dropout_in_model(ref_model)
|
||||
|
||||
self.finetuning_args = finetuning_args
|
||||
self.f_divergence_type = "reverse_kl"
|
||||
self.reference_free = False
|
||||
self.use_dpo_data_collator = True # hack to avoid warning
|
||||
self.generate_during_eval = False # disable at evaluation
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user