fix #1073 #1462 #1735 #1908

Former-commit-id: cd8e2535aa66931b24b96e76c2b56ce703a579b1
2026-03-20 04:46:01 +08:00 · 2023-12-20 17:15:40 +08:00
parent b5238e945a
commit 2b1e52dcc9
1 changed file with 3 additions and 0 deletions
--- a/src/llmtuner/train/sft/workflow.py
+++ b/src/llmtuner/train/sft/workflow.py
@@ -32,6 +32,9 @@ def run_sft(
    if training_args.predict_with_generate:
        tokenizer.padding_side = "left" # use left-padding in generation

+    if getattr(model, "is_quantized", False) and not training_args.do_train:
+        setattr(model, "_hf_peft_config_loaded", True) # hack here: make model compatible with prediction
+
    data_collator = DataCollatorForSeq2Seq(
        tokenizer=tokenizer,
        pad_to_multiple_of=8 if tokenizer.padding_side == "right" else None, # for shift short attention