Fix bug in data loader; support DPO eval

Former-commit-id: f4f3dcff990468a2fa864b7176adcebbcf16dac9
This commit is contained in:
hiyouga
2023-11-03 00:34:26 +08:00
parent 065021d82a
commit 217fde0918
3 changed files with 9 additions and 2 deletions

View File

@@ -30,6 +30,7 @@ class CustomDPOTrainer(DPOTrainer):
self.is_encoder_decoder = model.config.is_encoder_decoder
self.ref_model = ref_model
self.use_dpo_data_collator = True # hack to avoid warning
self.generate_during_eval = False # disable at evaluation
self.label_pad_token_id = IGNORE_INDEX
self.padding_value = 0
self.beta = beta