Add multimodal LLMs BLIP-2 and InstructBLIP

Former-commit-id: 67800c565b086f362b8cf131b0c9babaa7a7ebc7
This commit is contained in:
BUAADreamer
2024-04-23 19:22:42 +08:00
parent 0b99b13786
commit 1451297c78
3 changed files with 4 additions and 6 deletions

View File

@@ -184,7 +184,6 @@ def get_mm_dataset(
training_args: "Seq2SeqTrainingArguments",
stage: Literal["pt", "sft", "rm", "ppo"],
) -> Union["Dataset", "IterableDataset"]:
tokenizer = processor.tokenizer
if data_args.tokenized_path is not None:
if has_tokenized_data(data_args.tokenized_path):
logger.warning("Loading dataset from disk will ignore other data arguments.")