mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-08-22 13:42:51 +08:00
Merge pull request #4580 from hzhaoy/bugfix-deepspeed-pissa
Fix bug when using the PiSSA method with DeepSpeed
Former-commit-id: ef38daa0a49567bc4577136ac99e307cf535cf79
This commit is contained in:
commit
1dad756cff
@@ -53,6 +53,9 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
|
|||||||
self.processor = processor
|
self.processor = processor
|
||||||
|
|
||||||
if finetuning_args.pissa_convert:
|
if finetuning_args.pissa_convert:
|
||||||
|
if self.is_deepspeed_enabled:
|
||||||
|
self.accelerator.deepspeed_config = self.accelerator.state.deepspeed_plugin.deepspeed_config
|
||||||
|
self.deepspeed = self._wrap_model(self.model_wrapped)
|
||||||
self.save_model(os.path.join(self.args.output_dir, "pissa_init"))
|
self.save_model(os.path.join(self.args.output_dir, "pissa_init"))
|
||||||
|
|
||||||
if finetuning_args.use_badam:
|
if finetuning_args.use_badam:
|
||||||
|
Loading…
x
Reference in New Issue
Block a user