update dataset

Former-commit-id: 4fc2c3293d91d8464527ebd1ddabe572c8355616
This commit is contained in:
hiyouga
2023-07-23 20:01:43 +08:00
parent 3ee37a76e6
commit 9802398c71
4 changed files with 47 additions and 3 deletions

View File

@@ -21,7 +21,7 @@
},
"oaast_sft": {
"file_name": "oaast_sft.json",
"file_sha1": "08912e34fb165db137d3436db4c35321e33b28d1",
"file_sha1": "7baf5d43e67a91f9bbdf4e400dbe033b87e9757e",
"columns": {
"prompt": "instruction",
"query": "input",
@@ -31,7 +31,7 @@
},
"oaast_sft_zh": {
"file_name": "oaast_sft_zh.json",
"file_sha1": "e0a2e7e8eff355434ada6c9b7f70bb915f941dd4",
"file_sha1": "a6a91f18f80f37b10ded9cf633fb50c033bf7b9f",
"columns": {
"prompt": "instruction",
"query": "input",
@@ -187,5 +187,41 @@
"response": "",
"history": ""
}
},
"refinedweb": {
"hf_hub_url": "tiiuae/falcon-refinedweb",
"columns": {
"prompt": "content",
"query": "",
"response": "",
"history": ""
}
},
"starcoder": {
"hf_hub_url": "bigcode/starcoderdata",
"columns": {
"prompt": "content",
"query": "",
"response": "",
"history": ""
}
},
"wikipedia_en": {
"hf_hub_url": "olm/olm-wikipedia-20221220",
"columns": {
"prompt": "text",
"query": "",
"response": "",
"history": ""
}
},
"wikipedia_zh": {
"hf_hub_url": "pleisto/wikipedia-cn-20230720-filtered",
"columns": {
"prompt": "completion",
"query": "",
"response": "",
"history": ""
}
}
}