fix cache dir

Former-commit-id: 1909f0d11732bd99fadc6c1191e026137c6a7dff
This commit is contained in:
xingjun.wang 2023-12-12 14:21:33 +08:00
parent c1974c91e5
commit 1bd75afae8

View File

@@ -55,16 +55,8 @@ def get_dataset(
if int(os.environ.get('USE_MODELSCOPE_HUB', '0')) and dataset_attr.load_from == "ms_hub": if int(os.environ.get('USE_MODELSCOPE_HUB', '0')) and dataset_attr.load_from == "ms_hub":
from modelscope import MsDataset from modelscope import MsDataset
cache_dir = model_args.cache_dir from modelscope.utils.config_ds import MS_DATASETS_CACHE
cache_dir = str(cache_dir) if cache_dir is not None else None cache_dir = model_args.cache_dir or MS_DATASETS_CACHE
print(f'>data_path: {data_path}, '
f'>data_name: {data_name}, '
f'>split: {data_args.split},'
f'>data_files: {data_files}, '
f'>cache_dir: {cache_dir},'
f'>token: {model_args.ms_hub_token},'
f'>streaming: {data_args.streaming}')
dataset = MsDataset.load( dataset = MsDataset.load(
dataset_name=data_path, dataset_name=data_path,