refactor mm training

Former-commit-id: 3382317e32
This commit is contained in:
hiyouga
2024-08-30 02:14:31 +08:00
parent 98b0c7530c
commit a83756b5e9
32 changed files with 505 additions and 472 deletions

View File

@@ -38,20 +38,6 @@
"assistant_tag": "assistant"
}
},
"qwen2vl_demo": {
"file_name": "qwen2vl_demo.json",
"formatting": "sharegpt",
"columns": {
"messages": "messages",
"images": "images"
},
"tags": {
"role_tag": "role",
"content_tag": "content",
"user_tag": "user",
"assistant_tag": "assistant"
}
},
"alpaca_en": {
"hf_hub_url": "llamafactory/alpaca_en",
"ms_hub_url": "llamafactory/alpaca_en"

View File

@@ -2,7 +2,7 @@
{
"messages": [
{
"content": "Who are they?",
"content": "<image>Who are they?",
"role": "user"
},
{
@@ -25,7 +25,7 @@
{
"messages": [
{
"content": "Who is he?",
"content": "<image>Who is he?",
"role": "user"
},
{
@@ -48,7 +48,7 @@
{
"messages": [
{
"content": "Please describe this image",
"content": "<image>Please describe this image",
"role": "user"
},
{
@@ -71,7 +71,7 @@
{
"messages": [
{
"content": "他们是谁?",
"content": "<image>他们是谁?",
"role": "user"
},
{
@@ -94,7 +94,7 @@
{
"messages": [
{
"content": "他是谁?",
"content": "<image>他是谁?",
"role": "user"
},
{
@@ -117,7 +117,7 @@
{
"messages": [
{
"content": "请描述这张图片",
"content": "<image>请描述这张图片",
"role": "user"
},
{

View File

@@ -1,140 +0,0 @@
[
{
"messages": [
{
"content": "<|image_pad|>Who are they?",
"role": "user"
},
{
"content": "They're Kane and Gretzka from Bayern Munich.",
"role": "assistant"
},
{
"content": "What are they doing?",
"role": "user"
},
{
"content": "They are celebrating on the soccer field.",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/1.jpg"
]
},
{
"messages": [
{
"content": "<|image_pad|>Who is he?",
"role": "user"
},
{
"content": "He's Thomas Muller from Bayern Munich.",
"role": "assistant"
},
{
"content": "<|image_pad|>Why is he on the ground?",
"role": "user"
},
{
"content": "Because he's sliding on his knees to celebrate.",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/2.jpg","mllm_demo_data/2.jpg"
]
},
{
"messages": [
{
"content": "<|image_pad|>Please describe this image",
"role": "user"
},
{
"content": "Chinese astronaut Gui Haichao is giving a speech.",
"role": "assistant"
},
{
"content": "What has he accomplished?",
"role": "user"
},
{
"content": "He was appointed to be a payload specialist on Shenzhou 16 mission in June 2022, thus becoming the first Chinese civilian of Group 3 in space on 30 May 2023. He is responsible for the on-orbit operation of space science experimental payloads.",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/3.jpg"
]
},
{
"messages": [
{
"content": "<|image_pad|>他们是谁?",
"role": "user"
},
{
"content": "他们是拜仁慕尼黑的凯恩和格雷茨卡。",
"role": "assistant"
},
{
"content": "<|image_pad|>他们在做什么?",
"role": "user"
},
{
"content": "他们在足球场上庆祝。",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/1.jpg","mllm_demo_data/1.jpg"
]
},
{
"messages": [
{
"content": "<|image_pad|>他是谁?",
"role": "user"
},
{
"content": "他是来自拜仁慕尼黑的托马斯·穆勒。",
"role": "assistant"
},
{
"content": "他为什么在地上?",
"role": "user"
},
{
"content": "因为他正在双膝跪地滑行庆祝。",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/2.jpg"
]
},
{
"messages": [
{
"content": "<|image_pad|>请描述这张图片",
"role": "user"
},
{
"content": "中国宇航员桂海潮正在讲话。",
"role": "assistant"
},
{
"content": "他取得过哪些成就?",
"role": "user"
},
{
"content": "他于2022年6月被任命为神舟十六号任务的有效载荷专家从而成为2023年5月30日进入太空的首位平民宇航员。他负责在轨操作空间科学实验有效载荷。",
"role": "assistant"
}
],
"images": [
"mllm_demo_data/3.jpg"
]
}
]