update dataset

Former-commit-id: f5c2ccdde45bfa5648443a901b2ac397d532eceb
This commit is contained in:
hiyouga 2023-07-26 17:05:12 +08:00
parent c52dd3e86f
commit ba911f988d
6 changed files with 6433 additions and 4 deletions

View File

@ -83,6 +83,7 @@
- [BELLE School Math 0.25M (zh)](https://huggingface.co/datasets/BelleGroup/school_math_0.25M) - [BELLE School Math 0.25M (zh)](https://huggingface.co/datasets/BelleGroup/school_math_0.25M)
- [BELLE Multiturn Chat 0.8M (zh)](https://huggingface.co/datasets/BelleGroup/multiturn_chat_0.8M) - [BELLE Multiturn Chat 0.8M (zh)](https://huggingface.co/datasets/BelleGroup/multiturn_chat_0.8M)
- [Firefly 1.1M (zh)](https://huggingface.co/datasets/YeungNLP/firefly-train-1.1M) - [Firefly 1.1M (zh)](https://huggingface.co/datasets/YeungNLP/firefly-train-1.1M)
- [LIMA (en)](https://huggingface.co/datasets/GAIR/lima)
- [CodeAlpaca 20k (en)](https://huggingface.co/datasets/sahil2801/CodeAlpaca-20k) - [CodeAlpaca 20k (en)](https://huggingface.co/datasets/sahil2801/CodeAlpaca-20k)
- [Alpaca CoT (multilingual)](https://huggingface.co/datasets/QingyiSi/Alpaca-CoT) - [Alpaca CoT (multilingual)](https://huggingface.co/datasets/QingyiSi/Alpaca-CoT)
- [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa) - [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa)

View File

@ -83,6 +83,7 @@
- [BELLE School Math 0.25M (zh)](https://huggingface.co/datasets/BelleGroup/school_math_0.25M) - [BELLE School Math 0.25M (zh)](https://huggingface.co/datasets/BelleGroup/school_math_0.25M)
- [BELLE Multiturn Chat 0.8M (zh)](https://huggingface.co/datasets/BelleGroup/multiturn_chat_0.8M) - [BELLE Multiturn Chat 0.8M (zh)](https://huggingface.co/datasets/BelleGroup/multiturn_chat_0.8M)
- [Firefly 1.1M (zh)](https://huggingface.co/datasets/YeungNLP/firefly-train-1.1M) - [Firefly 1.1M (zh)](https://huggingface.co/datasets/YeungNLP/firefly-train-1.1M)
- [LIMA (en)](https://huggingface.co/datasets/GAIR/lima)
- [CodeAlpaca 20k (en)](https://huggingface.co/datasets/sahil2801/CodeAlpaca-20k) - [CodeAlpaca 20k (en)](https://huggingface.co/datasets/sahil2801/CodeAlpaca-20k)
- [Alpaca CoT (multilingual)](https://huggingface.co/datasets/QingyiSi/Alpaca-CoT) - [Alpaca CoT (multilingual)](https://huggingface.co/datasets/QingyiSi/Alpaca-CoT)
- [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa) - [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa)

View File

@ -51,7 +51,7 @@
}, },
"refgpt_zh_p1": { "refgpt_zh_p1": {
"file_name": "refgpt_zh_50k_p1.json", "file_name": "refgpt_zh_50k_p1.json",
"file_sha1": "995043a909eed6693f850a96fccb4d3803f3ea5e", "file_sha1": "b40f4f4d0ffacd16da7c275b056d5b6670021752",
"columns": { "columns": {
"prompt": "instruction", "prompt": "instruction",
"query": "input", "query": "input",
@ -61,7 +61,17 @@
}, },
"refgpt_zh_p2": { "refgpt_zh_p2": {
"file_name": "refgpt_zh_50k_p2.json", "file_name": "refgpt_zh_50k_p2.json",
"file_sha1": "d9442d5c4541fe5489b5b571871fbe7595ee3809", "file_sha1": "181f32b2c60264a29f81f59d3c76095793eae1b0",
"columns": {
"prompt": "instruction",
"query": "input",
"response": "output",
"history": "history"
}
},
"lima": {
"file_name": "lima.json",
"file_sha1": "9db59f6b7007dc4b17529fc63379b9cd61640f37",
"columns": { "columns": {
"prompt": "instruction", "prompt": "instruction",
"query": "input", "query": "input",

6417
data/lima.json Normal file

File diff suppressed because one or more lines are too long

View File

@ -1 +1 @@
56405bb8f52727e52e99693739494b9b7b0d7ba6 f967a4f6d04a11308a15524aa9a846a19a8d1e83

View File

@ -1 +1 @@
fa935248a5d40d2bdd5649af99a72a754d40ae7a 0a4f0d74fd1c5cab2eb6d84a3a3fe669847becd8