Former-commit-id: 02c8c55ce36b242338219a9a9132edfc52302206
This commit is contained in:
hiyouga 2024-02-20 20:44:24 +08:00
parent ba48084086
commit e87a17464f
2 changed files with 4 additions and 4 deletions

View File

@@ -112,9 +112,9 @@ def preprocess_packed_supervised_dataset(
input_ids += source_ids + target_ids input_ids += source_ids + target_ids
labels += source_mask + target_ids labels += source_mask + target_ids
if template.efficient_eos: if template.efficient_eos:
input_ids += [tokenizer.eos_token_id] input_ids += [tokenizer.eos_token_id]
labels += [tokenizer.eos_token_id] labels += [tokenizer.eos_token_id]
total_length = len(input_ids) total_length = len(input_ids)
block_size = data_args.cutoff_len block_size = data_args.cutoff_len

View File

@@ -477,7 +477,7 @@ LOCALES = {
}, },
"zh": { "zh": {
"label": "序列打包", "label": "序列打包",
"info": "在指令监督微调阶段将序列打包为相同长度的样本。", "info": "在指令监督微调时将序列打包为等长样本。",
}, },
}, },
"upcast_layernorm": { "upcast_layernorm": {