support layerwise galore

This commit is contained in:
hiyouga
2024-03-10 00:24:11 +08:00
parent 18ffce36b5
commit 8664262cde
14 changed files with 109 additions and 51 deletions

View File

@@ -50,7 +50,7 @@ def run_sft(
training_args.generation_num_beams = data_args.eval_num_beams or training_args.generation_num_beams
# Initialize our Trainer
- optimizer = create_custom_optimzer(model, training_args, finetuning_args)
+ optimizer = create_custom_optimzer(model, dataset, training_args, finetuning_args)
trainer = CustomSeq2SeqTrainer(
model=model,
args=training_args,