fix SFT trainer

Former-commit-id: bf09b6a6cd75cc2738d9af6b8c30bcbba77fa9b5
2025-10-15 08:08:09 +08:00 · 2023-10-31 21:52:52 +08:00 · 2023-10-31 21:52:52 +08:00 · 2406200914
commit 2406200914
parent db06fcfc84
1 changed file with 1 addition and 1 deletion
--- a/src/llmtuner/tuner/sft/trainer.py
+++ b/src/llmtuner/tuner/sft/trainer.py
@@ -33,10 +33,10 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
        Subclass and override to inject custom behavior.
        """
        labels = inputs["labels"].clone() if "labels" in inputs else None # backup labels
        if self.args.predict_with_generate:
            assert self.tokenizer.padding_side == "left", "This method only accepts left-padded tensor."
            prompt_len, label_len = inputs["input_ids"].size(-1), inputs["labels"].size(-1)
            labels = inputs["labels"].clone()
            if prompt_len > label_len:
                inputs["labels"] = self._pad_tensors_to_target_len(inputs["labels"], inputs["input_ids"])
            if label_len > prompt_len: