diff --git a/src/llamafactory/data/mm_plugin.py b/src/llamafactory/data/mm_plugin.py index be8cea9d..a3a6a4d9 100644 --- a/src/llamafactory/data/mm_plugin.py +++ b/src/llamafactory/data/mm_plugin.py @@ -1630,6 +1630,9 @@ class GLM4VPlugin(Qwen2VLPlugin): ) video_structure += frame_structure + if not self.expand_mm_tokens: + video_structure = self.video_token + content = content.replace(VIDEO_PLACEHOLDER, f"<|begin_of_video|>{video_structure}<|end_of_video|>", 1) num_video_tokens += 1