Update dataset_info.json

Added the Nectar dataset, already preprocessed and split into SFT and RL subsets. I added a preprompt to each instruction, since this has been shown to improve instruction following.

Former-commit-id: 9468ee9012bfe7124fc5cc2acebcfe03a6d0cdee
This commit is contained in:
Marco 2023-11-30 16:21:34 +01:00 committed by GitHub
parent 3d291a82d3
commit a26f68ba47

View File

@ -266,6 +266,12 @@
"columns": { "columns": {
"prompt": "content" "prompt": "content"
} }
"nectar_rlaif": {
"hf_hub_url": "mlinmg/RLAIF-Nectar",
"ranking": true
},
"nectar_sft": {
"hf_hub_url": "mlinmg/SFT-Nectar"
}, },
"starcoder": { "starcoder": {
"hf_hub_url": "bigcode/starcoderdata", "hf_hub_url": "bigcode/starcoderdata",