Former-commit-id: ce2340193e751c4212650b27f16c671261015047
This commit is contained in:
hiyouga 2024-02-20 20:44:24 +08:00
parent e237f618c2
commit a3f30038a0
2 changed files with 4 additions and 4 deletions

View File

@@ -112,9 +112,9 @@ def preprocess_packed_supervised_dataset(
input_ids += source_ids + target_ids
labels += source_mask + target_ids
if template.efficient_eos:
input_ids += [tokenizer.eos_token_id]
labels += [tokenizer.eos_token_id]
if template.efficient_eos:
input_ids += [tokenizer.eos_token_id]
labels += [tokenizer.eos_token_id]
total_length = len(input_ids)
block_size = data_args.cutoff_len

View File

@@ -477,7 +477,7 @@ LOCALES = {
},
"zh": {
"label": "序列打包",
"info": "在指令监督微调阶段将序列打包为相同长度的样本。",
"info": "在指令监督微调时将序列打包为等长样本。",
},
},
"upcast_layernorm": {