update examples

Former-commit-id: cce238f7d07919b79237bc9ab39265766c20f020
This commit is contained in:
hiyouga
2024-06-27 00:53:33 +08:00
parent 5a7cb9af4e
commit 8e5b4bddf4
4 changed files with 6 additions and 5 deletions

View File

@@ -7,7 +7,7 @@ do_train: true
finetuning_type: lora
lora_target: all
pref_beta: 0.1
-pref_loss: sigmoid # [sigmoid (dpo), orpo, simpo]
+pref_loss: sigmoid # choices: [sigmoid (dpo), orpo, simpo]
### dataset
dataset: dpo_en_demo