Update dataset_info.json

Added the Nectar dataset, already preprocessed and split into SFT and RL subsets. I added a preprompt to each instruction, since this has been shown to improve instruction following. Former-commit-id: 9468ee9012
2026-06-22 15:19:00 +08:00 · 2023-11-30 16:21:34 +01:00
parent 3d291a82d3
commit a26f68ba47
1 changed file with 6 additions and 0 deletions
--- a/data/dataset_info.json
+++ b/data/dataset_info.json
@@ -266,6 +266,12 @@
    "columns": {
      "prompt": "content"
    }
  },
  "nectar_rlaif": {
    "hf_hub_url": "mlinmg/RLAIF-Nectar",
    "ranking": true
  },
  "nectar_sft": {
    "hf_hub_url": "mlinmg/SFT-Nectar"
  },
  "starcoder": {
    "hf_hub_url": "bigcode/starcoderdata",