support LongLoRA

This commit is contained in:
hiyouga
2023-09-27 21:55:50 +08:00
parent 4dd9b4d982
commit 90375f600d
8 changed files with 313 additions and 329 deletions

View File

@@ -90,6 +90,10 @@ class DataArguments:
default=0,
metadata={"help": "Size of the development set, should be an integer or a float in range `[0,1)`."}
)
# Optional boolean option that defaults to False (disabled).
# Per its help text, it turns on packing of questions and answers during the
# supervised fine-tuning stage; the code that reads this flag is not visible
# here -- NOTE(review): confirm where and how the packing is applied.
sft_packing: Optional[bool] = field(
default=False,
metadata={"help": "Packing the questions and answers in the supervised fine-tuning stage."}
)
def init_for_training(self): # support mixing multiple datasets
dataset_names = [ds.strip() for ds in self.dataset.split(",")]