Former-commit-id: 51df8657348ac3153e1a44143dc61008f10ab186
This commit is contained in:
hiyouga 2024-02-03 23:45:31 +08:00
parent 0fc8612b97
commit 961368a8c4

View File

@@ -155,9 +155,6 @@ def get_dataset(
dataset = dataset.to_iterable_dataset()
return dataset
if data_args.streaming:
raise ValueError("Turn off dataset streaming to save cache files.")
with training_args.main_process_first(desc="load dataset"):
all_datasets = []
for dataset_attr in get_dataset_list(data_args): # TODO: add split