Mirror of https://github.com/hiyouga/LLaMA-Factory.git
Synced 2025-08-04 12:42:51 +08:00

Commit 53fcc531b5: update info
Parent: 1f2c56bff9
Former-commit-id: 17c64a05796cac70fc76ed728705cd60efa41cae
@@ -128,8 +128,8 @@ def load_model_and_tokenizer(
             LlamaModule.LlamaAttention = LlamaPatches.LlamaFlashAttention2
             LlamaModule.LlamaModel._prepare_decoder_attention_mask = LlamaPatches._prepare_decoder_attention_mask
             logger.info("Using FlashAttention-2 for faster training and inference.")
-        elif getattr(config, "model_type", None) == "qwen":
-            logger.info("Qwen models automatically enable FlashAttention if installed.")
+        elif getattr(config, "model_type", None) in ["qwen", "Yi"]:
+            logger.info("Current model automatically enables FlashAttention if installed.")
         else:
             logger.warning("Current model does not support FlashAttention-2.")
     elif is_trainable and model_args.shift_attn and getattr(config, "model_type", None) == "llama":
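For readers unfamiliar with the pattern, the llama branch works by monkey-patching: it rebinds class attributes on the modeling module before the model is instantiated, so every attention layer built afterwards uses the FlashAttention-2 implementation, while the qwen/Yi branch only logs because those models handle FlashAttention themselves. Below is a minimal, self-contained sketch of that dispatch; enable_flash_attn, llama_module, and the stub classes are illustrative stand-ins, not the repository's actual LlamaModule/LlamaPatches names.

# Toy demonstration of the monkey-patch dispatch shown in the hunk.
# All names here (llama_module, enable_flash_attn, the stub classes)
# are illustrative stand-ins, not the repository's actual modules.
import logging
from types import SimpleNamespace

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)


class LlamaAttention:
    """Stub for the stock eager-attention class."""


class LlamaFlashAttention2(LlamaAttention):
    """Stub for the FlashAttention-2 replacement."""


# Stand-in for the HF llama modeling module whose attributes get patched.
llama_module = SimpleNamespace(LlamaAttention=LlamaAttention)


def enable_flash_attn(model_type: str) -> None:
    if model_type == "llama":
        # Rebind the module-level attribute; any model constructed after
        # this point resolves llama_module.LlamaAttention to the patch.
        llama_module.LlamaAttention = LlamaFlashAttention2
        logger.info("Using FlashAttention-2 for faster training and inference.")
    elif model_type in ["qwen", "Yi"]:
        logger.info("Current model automatically enables FlashAttention if installed.")
    else:
        logger.warning("Current model does not support FlashAttention-2.")


enable_flash_attn("llama")
# Attention layers built after the patch pick up the new class.
assert isinstance(llama_module.LlamaAttention(), LlamaFlashAttention2)

Because the patch must land before model construction, the real code runs this dispatch inside load_model_and_tokenizer ahead of instantiating the model.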