Mirror of https://github.com/hiyouga/LLaMA-Factory.git (synced 2025-08-23 14:22:51 +08:00)
parent dbe26e7cdf
commit 37c6a0c6dc
@@ -89,9 +89,6 @@ def patch_config(
     if getattr(config, "model_type", None) == "qwen2" and is_trainable and model_args.flash_attn == "fa2":
         setattr(config, "use_cache", False)  # qwen2 does not support use_cache when using flash attn
 
-    if getattr(config, "model_type", None) == "chatglm":
-        require_version("transformers==4.41.2", "To fix: pip install transformers==4.41.2")
-
     # deepspeed zero3 is not compatible with low_cpu_mem_usage
     init_kwargs["low_cpu_mem_usage"] = model_args.low_cpu_mem_usage and (not is_deepspeed_zero3_enabled())
 
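For readers who want to see the surviving logic in isolation, below is a minimal, self-contained sketch of what this hunk leaves in patch_config once the chatglm pin is dropped. The four-argument signature and the SimpleNamespace stand-ins are assumptions made for illustration; only the two patched statements come from the diff itself.

from types import SimpleNamespace

from transformers.integrations import is_deepspeed_zero3_enabled


def patch_config(config, model_args, init_kwargs, is_trainable):
    # qwen2 does not support use_cache when using flash attn, so it is
    # forced off for trainable qwen2 models configured with fa2.
    if getattr(config, "model_type", None) == "qwen2" and is_trainable and model_args.flash_attn == "fa2":
        setattr(config, "use_cache", False)

    # deepspeed zero3 is not compatible with low_cpu_mem_usage: ZeRO-3 shards
    # parameters at init time, which conflicts with meta-device loading.
    init_kwargs["low_cpu_mem_usage"] = model_args.low_cpu_mem_usage and (not is_deepspeed_zero3_enabled())


# Hypothetical usage with stand-in objects (not the repository's real types):
config = SimpleNamespace(model_type="qwen2", use_cache=True)
model_args = SimpleNamespace(flash_attn="fa2", low_cpu_mem_usage=True)
init_kwargs = {}
patch_config(config, model_args, init_kwargs, is_trainable=True)
assert config.use_cache is False
# Outside a DeepSpeed ZeRO-3 run, is_deepspeed_zero3_enabled() is False,
# so low_cpu_mem_usage passes through unchanged.
assert init_kwargs["low_cpu_mem_usage"] is True

The removed branch had pinned transformers to 4.41.2 via require_version whenever a chatglm config was loaded; with it gone, chatglm models no longer force a specific transformers release at config-patch time.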
|