Update dataset_info.json

Added the Nectar dataset, already preprocessed and split into SFT and RL subsets. I also added a preprompt to each instruction, since this has been shown to improve instruction following.

Former-commit-id: 9468ee9012bfe7124fc5cc2acebcfe03a6d0cdee
This commit is contained in:
Marco 2023-11-30 16:21:34 +01:00 committed by GitHub
parent 3d291a82d3
commit a26f68ba47

View File

@ -266,6 +266,12 @@
"columns": {
"prompt": "content"
}
"nectar_rlaif": {
"hf_hub_url": "mlinmg/RLAIF-Nectar",
"ranking": true
},
"nectar_sft": {
"hf_hub_url": "mlinmg/SFT-Nectar"
},
"starcoder": {
"hf_hub_url": "bigcode/starcoderdata",