mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2026-06-17 20:58:54 +08:00
[model] support Hy3-Preview (#10432)
This commit is contained in:
@@ -62,6 +62,10 @@ def add_z3_leaf_module(model: "PreTrainedModel") -> None:
|
||||
# deepseek v3 and kimi vl use custom code
|
||||
_set_z3_leaf_modules(model, ["DeepseekV3MoE"])
|
||||
|
||||
if model_type == "hy_v3":
|
||||
# hy3 uses custom code
|
||||
_set_z3_leaf_modules(model, ["HYV3MoE"])
|
||||
|
||||
if model_type == "ernie4_5_moe":
|
||||
from transformers.models.ernie4_5_moe.modeling_ernie4_5_moe import Ernie4_5_MoeSparseMoeBlock
|
||||
|
||||
|
||||
Reference in New Issue
Block a user