diff --git a/requirements/liger-kernel.txt b/requirements/liger-kernel.txt index bd27a1a0f..1fd2178ac 100644 --- a/requirements/liger-kernel.txt +++ b/requirements/liger-kernel.txt @@ -1 +1 @@ -liger-kernel>=0.5.5 +liger-kernel>=0.6.3 diff --git a/src/llamafactory/model/model_utils/liger_kernel.py b/src/llamafactory/model/model_utils/liger_kernel.py index a8f0e842e..70ed8a098 100644 --- a/src/llamafactory/model/model_utils/liger_kernel.py +++ b/src/llamafactory/model/model_utils/liger_kernel.py @@ -77,6 +77,8 @@ def apply_liger_kernel( from liger_kernel.transformers import apply_liger_kernel_to_qwen3 as apply_liger_kernel elif model_type == "qwen3_moe": from liger_kernel.transformers import apply_liger_kernel_to_qwen3_moe as apply_liger_kernel + elif model_type == "qwen3_next": + from liger_kernel.transformers import apply_liger_kernel_to_qwen3_next as apply_liger_kernel elif model_type == "gpt_oss": try: from liger_kernel.transformers import apply_liger_kernel_to_gpt_oss as apply_liger_kernel