Former-commit-id: 81176fe226da89eace89cb202bad68e73b7c2a02
This commit is contained in:
fzc8578
2025-01-04 11:11:15 +08:00
parent 5504b5254c
commit 2c120aa0df
7 changed files with 164 additions and 2 deletions

View File

@@ -149,6 +149,13 @@ class MultiModalDataCollatorForSeq2Seq(DataCollatorForSeq2Seq):
features.update(mm_inputs)
if isinstance(features.get("pixel_values"), list): # for pixtral inputs
features = features.data # use default_collate() instead of BatchEncoding.to()
if "image_bound" in features:
input_ids, position_ids = features['input_ids'], features['position_ids']
features['position_ids'] = F.pad(position_ids, (0, input_ids.shape[-1] - position_ids.shape[-1]))
new_features = {}
new_features.update({"data": features})
new_features.update(features)
features = new_features
return features