Former-commit-id: 23a8e64f1c47cd473c627effbe271233c136369c
This commit is contained in:
hiyouga
2024-02-21 21:55:14 +08:00
parent 67deefe527
commit a274900188
2 changed files with 3 additions and 2 deletions

View File

@@ -90,7 +90,7 @@ class RLHFArguments:
default=0.1,
metadata={"help": "The beta parameter for the DPO loss."},
)
-dpo_loss: Optional[Literal["sigmoid", "hinge", "ipo", "kto"]] = field(
+dpo_loss: Optional[Literal["sigmoid", "hinge", "ipo", "kto_pair"]] = field(
default="sigmoid",
metadata={"help": "The type of DPO loss to use."},
)