Former-commit-id: dbaef776a171dfb316567553788f2d81d35a51fb
This commit is contained in:
hiyouga 2023-09-21 19:52:06 +08:00
parent 4581d09fa6
commit 3bdc40b4db

View File

@@ -39,7 +39,7 @@ def run_sft(
# Override the decoding parameters of Seq2SeqTrainer # Override the decoding parameters of Seq2SeqTrainer
training_args_dict = training_args.to_dict() training_args_dict = training_args.to_dict()
training_args_dict.update(dict( training_args_dict.update(dict(
generation_max_length=training_args.generation_max_length or data_args.max_target_length, generation_max_length=training_args.generation_max_length or data_args.cutoff_len,
generation_num_beams=data_args.eval_num_beams or training_args.generation_num_beams generation_num_beams=data_args.eval_num_beams or training_args.generation_num_beams
)) ))
training_args = Seq2SeqTrainingArguments(**training_args_dict) training_args = Seq2SeqTrainingArguments(**training_args_dict)