add llamafy_qwen.py

Former-commit-id: f9769cff8a
2026-03-08 12:46:06 +08:00 · 2023-10-08 22:05:36 +08:00
parent 93809d1c3b
commit 69c99819d6
3 changed files with 187 additions and 31 deletions
--- a/src/llmtuner/tuner/core/loader.py
+++ b/src/llmtuner/tuner/core/loader.py
@@ -128,7 +128,7 @@ def load_model_and_tokenizer(
        else:
            logger.warning("Current model does not support RoPE scaling.")

-    # Set FlashAttention-2
+    # Set FlashAttention-2 and S^2-Attn
    if model_args.flash_attn:
        if getattr(config, "model_type", None) == "llama":
            LlamaModule.LlamaAttention = LlamaPatches.LlamaFlashAttention2