From dd4619e9f30cae0f894cf6b205b13beeaebd3331 Mon Sep 17 00:00:00 2001
From: BUAADreamer <1428195643@qq.com>
Date: Tue, 14 May 2024 14:03:19 +0800
Subject: [PATCH] add support for Yi-VL

Former-commit-id: d7834ca92d3048949caa48f8635cfbcea2c85771
---
 src/llmtuner/model/utils/visual.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/llmtuner/model/utils/visual.py b/src/llmtuner/model/utils/visual.py
index d1556bb3..79a6570e 100644
--- a/src/llmtuner/model/utils/visual.py
+++ b/src/llmtuner/model/utils/visual.py
@@ -43,10 +43,13 @@ class LlavaMultiModalProjectorYiVL(nn.Module):
         self.linear_3 = nn.Linear(config.text_config.hidden_size, config.text_config.hidden_size, bias=True)
         self.linear_4 = nn.LayerNorm(config.text_config.hidden_size, bias=True)
         self.act = nn.GELU()
-        self.proj = nn.Sequential(*[self.linear_1, self.linear_2, self.act, self.linear_3, self.linear_4])
 
     def forward(self, image_features):
-        hidden_states = self.proj(image_features)
+        hidden_states = self.linear_1(image_features)
+        hidden_states = self.linear_2(hidden_states)
+        hidden_states = self.act(hidden_states)
+        hidden_states = self.linear_3(hidden_states)
+        hidden_states = self.linear_4(hidden_states)
         return hidden_states