From 5b4b60cfb5e9196c223c06b68eeb9f22d2024e96 Mon Sep 17 00:00:00 2001 From: simonJJJ <821898965@qq.com> Date: Wed, 28 Aug 2024 20:22:46 +0800 Subject: [PATCH] update Former-commit-id: a968a416d5e513320c97109229ca1e6ddc003cb1 --- src/llamafactory/data/processors/supervised.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/llamafactory/data/processors/supervised.py b/src/llamafactory/data/processors/supervised.py index 90da57a1..6b3a4562 100644 --- a/src/llamafactory/data/processors/supervised.py +++ b/src/llamafactory/data/processors/supervised.py @@ -68,7 +68,7 @@ def _encode_supervised_example( ) index += 1 message["content"] = content.replace("<|placeholder|>", "<|image_pad|>") - if processor is not None and not hasattr(processor, "image_seq_length"): # llava-like models + elif processor is not None and not hasattr(processor, "image_seq_length"): # llava-like models prompt[0]["content"] = template.image_token + prompt[0]["content"] messages = prompt + response @@ -146,6 +146,7 @@ def preprocess_supervised_dataset( response=examples["response"][i], system=examples["system"][i], tools=examples["tools"][i], + images=examples["images"][i], template=template, tokenizer=tokenizer, processor=processor,