Former-commit-id: fede563aeb716ba5d1e368fd3e1182e4e580d248
This commit is contained in:
fzc8578
2025-01-10 20:01:22 +08:00
parent 8c2a712247
commit 9e972bc9ec
5 changed files with 45 additions and 13 deletions

View File

@@ -149,14 +149,14 @@ class MultiModalDataCollatorForSeq2Seq(DataCollatorForSeq2Seq):
features.update(mm_inputs)
if isinstance(features.get("pixel_values"), list): # for pixtral inputs
features = features.data # use default_collate() instead of BatchEncoding.to()
if "image_bound" in features:
input_ids, position_ids = features['input_ids'], features['position_ids']
features['position_ids'] = F.pad(position_ids, (0, input_ids.shape[-1] - position_ids.shape[-1]))
if "image_bound" in features: # for minicpmv inputs
features = self.template.mm_plugin.pad_data(features)
new_features = {}
new_features.update({"data": features})
new_features.update(features)
features = new_features
return features