mirror of https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-15 03:10:35 +08:00
update readme
@@ -1,6 +1,6 @@
 from typing import TYPE_CHECKING, Any, Dict, List, Optional

-from ...extras.constants import IGNORE_INDEX, IMAGE_TOKEN
+from ...extras.constants import IGNORE_INDEX
 from ...extras.logging import get_logger
 from .mm_utils import get_paligemma_token_type_ids, get_pixel_values

@@ -44,7 +44,7 @@ def preprocess_pairwise_dataset(
             continue

         if processor is not None and not hasattr(processor, "image_seq_length"):  # llava-like models
-            examples["prompt"][i][0]["content"] = IMAGE_TOKEN + examples["prompt"][i][0]["content"]
+            examples["prompt"][i][0]["content"] = template.image_token + examples["prompt"][i][0]["content"]

         chosen_messages = examples["prompt"][i] + [examples["response"][i][0]]
         rejected_messages = examples["prompt"][i] + [examples["response"][i][1]]
@@ -70,7 +70,7 @@ def preprocess_pairwise_dataset(
             rejected_ids += [tokenizer.eos_token_id]

         if processor is not None and hasattr(processor, "image_seq_length"):  # paligemma models
-            image_token_id = tokenizer.convert_tokens_to_ids(IMAGE_TOKEN)
+            image_token_id = tokenizer.convert_tokens_to_ids(template.image_token)
             prompt_ids = [image_token_id] * getattr(processor, "image_seq_length") + prompt_ids

         chosen_input_ids = prompt_ids + chosen_ids
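The diff replaces the global IMAGE_TOKEN constant with the per-template template.image_token, so each model family's template can define its own image placeholder. Below is a minimal, self-contained sketch (not the repository's exact code; the Template dataclass and the "<image>" default are illustrative stand-ins) of the two branches this change touches: llava-like models get the image token prepended as a string to the first prompt message, while paligemma models get image_seq_length copies of the image token id prepended to the already-tokenized prompt.

# Minimal sketch; Template and its "<image>" default are assumptions for illustration.
from dataclasses import dataclass
from typing import Any, Dict, List, Optional


@dataclass
class Template:
    image_token: str = "<image>"  # assumed placeholder; real templates define their own


def insert_image_placeholder(prompt: List[Dict[str, str]], template: Template, processor: Optional[Any]) -> None:
    # llava-like models: prepend the image token string to the first user turn.
    if processor is not None and not hasattr(processor, "image_seq_length"):
        prompt[0]["content"] = template.image_token + prompt[0]["content"]


def prepend_image_token_ids(prompt_ids: List[int], template: Template, tokenizer: Any, processor: Optional[Any]) -> List[int]:
    # paligemma models: resolve the token id from the template's image token and
    # prepend image_seq_length copies to the tokenized prompt.
    if processor is not None and hasattr(processor, "image_seq_length"):
        image_token_id = tokenizer.convert_tokens_to_ids(template.image_token)
        prompt_ids = [image_token_id] * getattr(processor, "image_seq_length") + prompt_ids
    return prompt_ids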