support full-parameter PPO

Former-commit-id: 4af967d69475e1c9fdf1a7983cd6b83bd431abff
This commit is contained in:
hiyouga
2023-11-16 02:08:04 +08:00
parent c970270c94
commit 685d0c975a
20 changed files with 288 additions and 145 deletions

View File

@@ -88,11 +88,7 @@
},
"belle_multiturn": {
"script_url": "belle_multiturn",
-"columns": {
-"prompt": "instruction",
-"response": "output",
-"history": "history"
-}
+"formatting": "sharegpt"
},
"ultra_chat": {
"script_url": "ultra_chat",
@@ -107,6 +103,13 @@
"alpaca_cot": {
"hf_hub_url": "QingyiSi/Alpaca-CoT"
},
+"openorca": {
+"hf_hub_url": "Open-Orca/OpenOrca",
+"columns": {
+"prompt": "question",
+"response": "response"
+}
+},
"mathinstruct": {
"hf_hub_url": "TIGER-Lab/MathInstruct",
"columns": {