update dpo examples

This commit is contained in:
hiyouga 2024-05-27 19:56:04 +08:00
parent efa4b196ca
commit 30e1c8e745
1 changed file with 1 addition and 0 deletions

View File

@@ -6,6 +6,7 @@ stage: dpo
do_train: true
finetuning_type: lora
lora_target: q_proj,v_proj
pref_beta: 0.1
pref_loss: sigmoid # [sigmoid (dpo), orpo, simpo]
### dataset