fix #4742
This commit is contained in:
parent
86b1594823
commit
2f09520c0d
|
@ -54,6 +54,7 @@ class CustomDPOTrainer(DPOTrainer):
|
||||||
disable_dropout_in_model(ref_model)
|
disable_dropout_in_model(ref_model)
|
||||||
|
|
||||||
self.finetuning_args = finetuning_args
|
self.finetuning_args = finetuning_args
|
||||||
|
self.f_divergence_type = "reverse_kl"
|
||||||
self.reference_free = False
|
self.reference_free = False
|
||||||
self.use_dpo_data_collator = True # hack to avoid warning
|
self.use_dpo_data_collator = True # hack to avoid warning
|
||||||
self.generate_during_eval = False # disable at evaluation
|
self.generate_during_eval = False # disable at evaluation
|
||||||
|
|
Loading…
Reference in New Issue