Merge pull request #4580 from hzhaoy/bugfix-deepspeed-pissa

Fix a bug when using the PiSSA method with DeepSpeed

Former-commit-id: ef38daa0a49567bc4577136ac99e307cf535cf79
This commit is contained in:
hoshi-hiyouga 2024-06-28 00:46:51 +08:00 committed by GitHub
commit 1dad756cff

View File

@@ -53,6 +53,9 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
self.processor = processor
if finetuning_args.pissa_convert:
if self.is_deepspeed_enabled:
self.accelerator.deepspeed_config = self.accelerator.state.deepspeed_plugin.deepspeed_config
self.deepspeed = self._wrap_model(self.model_wrapped)
self.save_model(os.path.join(self.args.output_dir, "pissa_init"))
if finetuning_args.use_badam: