From 8669a22e9cffa9afe38e005eb20de906cbb44398 Mon Sep 17 00:00:00 2001 From: jiaqiw09 <60021713+jiaqiw09@users.noreply.github.com> Date: Tue, 16 Jun 2026 18:21:52 +0800 Subject: [PATCH] [fix] fix liger kernel patch for npu (#10583) --- src/llamafactory/model/model_utils/liger_kernel.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/src/llamafactory/model/model_utils/liger_kernel.py b/src/llamafactory/model/model_utils/liger_kernel.py index 56b64b03a..4f63e10c1 100644 --- a/src/llamafactory/model/model_utils/liger_kernel.py +++ b/src/llamafactory/model/model_utils/liger_kernel.py @@ -16,6 +16,7 @@ import inspect from typing import TYPE_CHECKING from ...extras import logging +from ...extras.misc import get_device_name if TYPE_CHECKING: @@ -99,5 +100,12 @@ def apply_liger_kernel( else: kwargs = {} + if get_device_name() == "npu": + import torch + + if "Ascend910" not in torch.npu.get_device_name(0): + kwargs["swiglu"] = False + kwargs["fused_linear_cross_entropy"] = False + apply_liger_kernel(**kwargs) logger.info_rank0("Liger kernel has been applied to the model.")