Mirror of https://github.com/hiyouga/LLaMA-Factory.git (synced 2025-11-05 18:32:14 +08:00)
Parent: b353a080cb
Commit: 04da91e84e
@@ -139,6 +139,7 @@ def _configure_quantization(
 
         if quant_method == QuantizationMethod.GPTQ:
             require_version("auto_gptq>=0.5.0", "To fix: pip install auto_gptq>=0.5.0")
+            quantization_config.pop("disable_exllama", None)  # remove deprecated args
             quantization_config["use_exllama"] = False  # disable exllama
 
         if quant_method == QuantizationMethod.AWQ:
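
For context, a minimal sketch of what the patched GPTQ branch does to the quantization settings. The quantization_config dict below is illustrative only (in the repo it is read from a GPTQ-quantized checkpoint's config), but the two lines inside the if mirror the commit: the deprecated disable_exllama key is dropped and use_exllama is set to False so the exllama kernels stay disabled.

from typing import Any, Dict

# Illustrative stand-in for config.quantization_config of a GPTQ checkpoint;
# keys other than quant_method and disable_exllama are hypothetical examples.
quantization_config: Dict[str, Any] = {
    "quant_method": "gptq",
    "bits": 4,
    "group_size": 128,
    "disable_exllama": True,  # deprecated key that the commit strips out
}

if quantization_config.get("quant_method", "") == "gptq":
    quantization_config.pop("disable_exllama", None)  # remove deprecated args
    quantization_config["use_exllama"] = False  # disable exllama

print(quantization_config)
# {'quant_method': 'gptq', 'bits': 4, 'group_size': 128, 'use_exllama': False}

Transformers deprecated disable_exllama in favor of use_exllama in its GPTQConfig, which is presumably why the commit removes the old key before setting the new one.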