From 2918743520a488df914305f9d24e105d3465e784 Mon Sep 17 00:00:00 2001
From: "xingjun.wang"
Date: Tue, 12 Dec 2023 11:47:59 +0800
Subject: [PATCH] for test

Former-commit-id: 8a908a8c644f4a961001cdd8388a3a7fea992c55
---
Note (review): this patch was hand-edited after export.
 * map() is now called directly on the object returned by to_hf_dataset().
   `ds_instance` is an MsDataset property and is presumably not available on
   the unwrapped dataset -- confirm against the installed modelscope version.
 * Leading indentation of the hunk lines was reconstructed; apply with
   `git apply --ignore-whitespace` if the context does not match exactly.
 * The blob ids on the `index` line are those of the original commit.

 src/llmtuner/data/loader.py | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/src/llmtuner/data/loader.py b/src/llmtuner/data/loader.py
index 41c12422..70beea05 100644
--- a/src/llmtuner/data/loader.py
+++ b/src/llmtuner/data/loader.py
@@ -59,6 +59,13 @@ def get_dataset(
                 dataset_name=data_path,
                 subset_name=data_name,
             ).to_hf_dataset()
+
+            def map_func(example):
+                # Coerce a falsy 'input' value (e.g. None) to an empty string.
+                example['input'] = example['input'] or ''
+                return example
+
+            dataset = dataset.map(map_func)
         else:
             dataset = load_dataset(
                 path=data_path,