Support DPO training (arXiv:2305.18290)

Former-commit-id: 6d98de148e4af63a7028dfaeb6cf86eb56a4488f
This commit is contained in:
hiyouga
2023-08-11 03:02:53 +08:00
parent 50345ed29a
commit 7ada4f5f6f
34 changed files with 513 additions and 212 deletions

View File

@@ -3,7 +3,7 @@ transformers>=4.29.1
datasets>=2.12.0
accelerate>=0.21.0
peft>=0.4.0
-trl>=0.4.7
+trl>=0.5.0
scipy
sentencepiece
tiktoken
@@ -16,4 +16,3 @@ pydantic==1.10.11
fastapi==0.95.1
sse-starlette
matplotlib
-huggingface_hub