From 3475198d1e11775c48ff2d00897c223644dccb50 Mon Sep 17 00:00:00 2001 From: Kingsley Date: Wed, 29 Apr 2026 20:20:55 +0800 Subject: [PATCH] [fa2] fix IMA when train qwen3_5 (#10448) --- src/llamafactory/model/patcher.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/llamafactory/model/patcher.py b/src/llamafactory/model/patcher.py index 1a258d552..be9c78df9 100644 --- a/src/llamafactory/model/patcher.py +++ b/src/llamafactory/model/patcher.py @@ -125,7 +125,7 @@ def patch_qwen3_5_forward(model: "PreTrainedModel") -> None: hidden_states, _ = self.self_attn( hidden_states=hidden_states, attention_mask=attention_mask, - position_ids=position_ids, + position_ids=position_ids[None, 0], # keep [1, B, L] past_key_values=past_key_values, cache_position=cache_position, position_embeddings=position_embeddings,