[model] support GLM-4.7-Flash SFT (#10173)

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
2026-03-02 01:36:02 +08:00 · 2026-02-09 08:10:44 +05:30
parent 92fa3df4c4
commit ea644d04ec
3 changed files with 45 additions and 0 deletions
--- a/src/llamafactory/model/model_utils/moe.py
+++ b/src/llamafactory/model/model_utils/moe.py
@@ -77,6 +77,11 @@ def add_z3_leaf_module(model: "PreTrainedModel") -> None:

        _set_z3_leaf_modules(model, [Glm4MoeMoE])

+    if model_type == "glm4_moe_lite":
+        from transformers.models.glm4_moe_lite.modeling_glm4_moe_lite import Glm4MoeLiteMoE
+
+        _set_z3_leaf_modules(model, [Glm4MoeLiteMoE])
+
    if model_type == "glm4v_moe":
        from transformers.models.glm4v_moe.modeling_glm4v_moe import Glm4vMoeTextMoE