fix possible OOM error

Former-commit-id: 0d590dffb41b0e832d9f87d20a23bcd0acd983aa
This commit is contained in:
hiyouga 2023-06-01 23:54:44 +08:00
parent 1512711ca2
commit 896dbfec16

View File

@@ -477,13 +477,13 @@ def preprocess_data(
desc="Running tokenizer on dataset" desc="Running tokenizer on dataset"
) )
if stage == "pt": if stage == "pt":
print_unsupervised_dataset_example(dataset[0]) print_unsupervised_dataset_example(dataset[0])
elif stage == "sft": elif stage == "sft":
print_supervised_dataset_example(dataset[0]) print_supervised_dataset_example(dataset[0])
elif stage == "rm": elif stage == "rm":
print_pairwise_dataset_example(dataset[0]) print_pairwise_dataset_example(dataset[0])
elif stage == "ppo": elif stage == "ppo":
print_unsupervised_dataset_example(dataset[0]) print_unsupervised_dataset_example(dataset[0])
return dataset return dataset