Former-commit-id: 415ce41e8fa887e980e5bd575c8e95bd4076b90b
This commit is contained in:
hiyouga 2024-04-21 19:20:18 +08:00
parent d16561e7a4
commit 1d341dcd83

View File

@@ -139,6 +139,7 @@ def _configure_quantization(
if quant_method == QuantizationMethod.GPTQ:
require_version("auto_gptq>=0.5.0", "To fix: pip install auto_gptq>=0.5.0")
quantization_config.pop("disable_exllama", None) # remove deprecated args
quantization_config["use_exllama"] = False # disable exllama
if quant_method == QuantizationMethod.AWQ: