Add multimodal LLMs BLIP-2 and InstructBLIP

Former-commit-id: 67800c565b086f362b8cf131b0c9babaa7a7ebc7
2024-04-23 19:22:42 +08:00
parent 0b99b13786
commit 1451297c78
3 changed files with 4 additions and 6 deletions
--- a/src/llmtuner/data/loader.py
+++ b/src/llmtuner/data/loader.py
@@ -184,7 +184,6 @@ def get_mm_dataset(
        training_args: "Seq2SeqTrainingArguments",
        stage: Literal["pt", "sft", "rm", "ppo"],
 ) -> Union["Dataset", "IterableDataset"]:
-    tokenizer = processor.tokenizer
    if data_args.tokenized_path is not None:
        if has_tokenized_data(data_args.tokenized_path):
            logger.warning("Loading dataset from disk will ignore other data arguments.")