forked from p04798526/LLaMA-Factory-Mirror
Merge pull request #4580 from hzhaoy/bugfix-deepspeed-pissa
Fix bug when using the PiSSA method with DeepSpeed
This commit is contained in:
commit
ef38daa0a4
|
@@ -53,6 +53,9 @@ class CustomSeq2SeqTrainer(Seq2SeqTrainer):
|
|||
self.processor = processor
|
||||
|
||||
if finetuning_args.pissa_convert:
|
||||
if self.is_deepspeed_enabled:
|
||||
self.accelerator.deepspeed_config = self.accelerator.state.deepspeed_plugin.deepspeed_config
|
||||
self.deepspeed = self._wrap_model(self.model_wrapped)
|
||||
self.save_model(os.path.join(self.args.output_dir, "pissa_init"))
|
||||
|
||||
if finetuning_args.use_badam:
|
||||
|
|
Loading…
Reference in New Issue