diff --git a/src/llamafactory/model/model_utils/visual.py b/src/llamafactory/model/model_utils/visual.py
index dd6de0986..4a855f31a 100644
--- a/src/llamafactory/model/model_utils/visual.py
+++ b/src/llamafactory/model/model_utils/visual.py
@@ -390,14 +390,14 @@ _register_composite_model(
         "visual.deepstack_merger_list",
         "audio_tower",
     ],
-    language_model_keys=["model", "lm_head"],
+    language_model_keys=["language_model", "lm_head"],
     lora_conflict_keys=["patch_embed"],
 )
 
 
 _register_composite_model(
     model_type="qwen3_5",
-    projector_key="visual.merger",
+    projector_key="model.visual.merger",
     vision_model_keys=["visual.pos_embed", "visual.patch_embed", "visual.blocks"],
     language_model_keys=["language_model", "lm_head"],
     lora_conflict_keys=["patch_embed"],
@@ -406,7 +406,7 @@ _register_composite_model(
 
 _register_composite_model(
     model_type="qwen3_5_moe",
-    projector_key="visual.merger",
+    projector_key="model.visual.merger",
     vision_model_keys=["visual.pos_embed", "visual.patch_embed", "visual.blocks"],
     language_model_keys=["language_model", "lm_head"],
     lora_conflict_keys=["patch_embed"],