Merge data part into the text stream

Former-commit-id: 42c90c8183
This commit is contained in:
BUAADreamer
2024-04-25 19:58:47 +08:00
parent c50474869f
commit 56028422e8
6 changed files with 18 additions and 38 deletions

View File

@@ -414,9 +414,6 @@
},
"folder": "python"
},
"llava_instruct": {
"hf_hub_url": "HuggingFaceH4/llava-instruct-mix-vsft"
},
"mllm_instruct_example": {
"file_name": "llava_instruct_example.json",
"formatting": "llava",

View File

@@ -1,25 +0,0 @@
---
# Dataset card metadata: feature schema plus the default config's split files.
# NOTE(review): the nesting below was reconstructed from text whose indentation
# had been flattened; confirm the placement of `role` and `images` against the
# upstream dataset card.
dataset_info:
  features:
    # Each message holds a list of content parts and a role string.
    - name: messages
      list:
        - name: content
          list:
            - name: index
              dtype: int64
            - name: text
              dtype: string
            - name: type
              dtype: string
        - name: role
          dtype: string
    # Images are stored as a sequence alongside the messages.
    - name: images
      sequence: image
configs:
  - config_name: default
    data_files:
      # Glob patterns selecting the files for each split.
      - split: train
        path: data/train-*
      - split: test
        path: data/test-*
---