update examples

Former-commit-id: d417e63f92
This commit is contained in:
hiyouga
2024-06-27 00:53:33 +08:00
parent f2425cb4ed
commit 6e03536dca
4 changed files with 6 additions and 5 deletions

View File

@@ -7,7 +7,7 @@ do_train: true
finetuning_type: lora
lora_target: all
pref_beta: 0.1
-pref_loss: sigmoid # [sigmoid (dpo), orpo, simpo]
+pref_loss: sigmoid # choices: [sigmoid (dpo), orpo, simpo]
### dataset
dataset: dpo_en_demo