[trainer] fix vlm loss for transformers 4.49 (#7448)
@@ -128,9 +128,9 @@ class CustomDPOTrainer(DPOTrainer):
         return super()._get_train_sampler()
 
     @override
-    def get_batch_samples(self, epoch_iterator, num_batches, *args, **kwargs):
+    def get_batch_samples(self, *args, **kwargs):
         r"""Replace the method of DPO Trainer with the one of the standard Trainer."""
-        return Trainer.get_batch_samples(self, epoch_iterator, num_batches, *args, **kwargs)
+        return Trainer.get_batch_samples(self, *args, **kwargs)
 
     def odds_ratio_loss(self, chosen_logps: "torch.Tensor", rejected_logps: "torch.Tensor") -> "torch.Tensor":
         r"""Compute ORPO's odds ratio (OR) loss for batched log probabilities of the policy model."""
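Note on the get_batch_samples change: dropping the explicit (epoch_iterator, num_batches) parameters and forwarding *args/**kwargs keeps the override valid even if the upstream Trainer.get_batch_samples signature changes between transformers releases. Below is a minimal sketch of the pattern with toy classes (not LLaMA-Factory or transformers code); the device parameter is only an example of an argument a newer release might add.

class Base:
    # Stand-in for transformers.Trainer; the signature may grow new parameters.
    def get_batch_samples(self, epoch_iterator, num_batches, device=None):
        return [next(epoch_iterator) for _ in range(num_batches)], None


class Derived(Base):
    # Forward everything instead of hard-coding the parameter list, so new
    # positional or keyword arguments pass straight through to the base class.
    def get_batch_samples(self, *args, **kwargs):
        return Base.get_batch_samples(self, *args, **kwargs)


batches, _ = Derived().get_batch_samples(iter(range(10)), 3, device="cpu")
print(batches)  # [0, 1, 2]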
@@ -127,9 +127,9 @@ class CustomKTOTrainer(KTOTrainer):
         return Trainer._get_train_sampler(self)
 
     @override
-    def get_batch_samples(self, epoch_iterator, num_batches, *args, **kwargs):
+    def get_batch_samples(self, *args, **kwargs):
         r"""Replace the method of KTO Trainer with the one of the standard Trainer."""
-        return Trainer.get_batch_samples(self, epoch_iterator, num_batches, *args, **kwargs)
+        return Trainer.get_batch_samples(self, *args, **kwargs)
 
     @override
     def forward(
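The @override marker kept on these methods is presumably the one from typing_extensions (typing.override on Python 3.12+); it is a no-op at runtime but lets a type checker warn if the base class ever removes or renames the method being overridden. A small self-contained example of the idiom:

from typing_extensions import override


class Base:
    def get_batch_samples(self, *args, **kwargs):
        return [], None


class Derived(Base):
    @override  # a type checker flags this if Base.get_batch_samples disappears or is renamed
    def get_batch_samples(self, *args, **kwargs):
        return super().get_batch_samples(*args, **kwargs)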
@@ -70,3 +70,7 @@ class CustomTrainer(Trainer):
             return torch.utils.data.SequentialSampler(self.train_dataset)
 
         return super()._get_train_sampler()
+
+    @override
+    def compute_loss(self, model, inputs, *args, **kwargs):
+        return super().compute_loss(model, inputs, *args, **kwargs)
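The new compute_loss in CustomTrainer is a pure pass-through, but writing it with *args/**kwargs makes the override point explicit while letting any extra arguments the upstream Trainer now supplies (for example the num_items_in_batch keyword used by recent transformers releases) flow through untouched. A toy sketch of that flow, with made-up classes rather than the real Trainer API:

class BaseTrainer:
    # Stand-in for transformers.Trainer.compute_loss; newer releases pass extra
    # keyword arguments such as num_items_in_batch.
    def compute_loss(self, model, inputs, return_outputs=False, num_items_in_batch=None):
        loss = sum(inputs) / (num_items_in_batch or len(inputs))
        return (loss, None) if return_outputs else loss


class PassThroughTrainer(BaseTrainer):
    def compute_loss(self, model, inputs, *args, **kwargs):
        # Nothing is dropped: positional and keyword arguments reach the base class as-is.
        return super().compute_loss(model, inputs, *args, **kwargs)


print(PassThroughTrainer().compute_loss(None, [1.0, 2.0, 3.0], num_items_in_batch=6))  # 1.0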
@@ -59,6 +59,9 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
             self.processing_class: PreTrainedTokenizer = kwargs.get("tokenizer")
 
         super().__init__(**kwargs)
+        if processor is not None:
+            self.model_accepts_loss_kwargs = False
+
         self.finetuning_args = finetuning_args
         if gen_kwargs is not None:
             # https://github.com/huggingface/transformers/blob/v4.45.0/src/transformers/trainer_seq2seq.py#L287
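This appears to be the core of the VLM loss fix: when a multimodal processor is attached, the trainer forces model_accepts_loss_kwargs to False so that, on recent transformers versions, the Trainer falls back to averaging the loss per micro-batch and scaling for gradient accumulation itself instead of handing a num_items_in_batch count to the model's forward. The toy below only illustrates why the two normalization paths can disagree when micro-batches hold different numbers of label tokens; it is an assumed simplification, not the transformers implementation.

def micro_batch_loss(token_losses, num_items_in_batch=None):
    if num_items_in_batch is not None:
        # "Model accepts loss kwargs" path: normalize by the token count of the
        # whole accumulated batch (assumed behaviour).
        return sum(token_losses) / num_items_in_batch
    # Fallback path: plain per-micro-batch mean, scaled by the trainer afterwards.
    return sum(token_losses) / len(token_losses)


micro_batches = [[0.5, 1.0, 1.5], [2.0, 1.0]]  # token-level losses, 5 tokens total
grad_accum = len(micro_batches)
total_tokens = sum(len(mb) for mb in micro_batches)

with_kwargs = sum(micro_batch_loss(mb, total_tokens) for mb in micro_batches)
fallback = sum(micro_batch_loss(mb) for mb in micro_batches) / grad_accum
print(with_kwargs, fallback)  # 1.2 vs 1.25: the paths only agree for equal-sized micro-batches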
@@ -93,6 +96,10 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
 
         return super()._get_train_sampler()
 
+    @override
+    def compute_loss(self, model, inputs, *args, **kwargs):
+        return super().compute_loss(model, inputs, *args, **kwargs)
+
     @override
     def prediction_step(
         self,