fix handling of ddp_find_unused_parameters
This commit is contained in:
@@ -1000,9 +1000,14 @@ class HFCausalTrainerBuilder(TrainerBuilderBase):
|
|||||||
and self.cfg.eval_steps
|
and self.cfg.eval_steps
|
||||||
and self.cfg.save_steps % self.cfg.eval_steps == 0
|
and self.cfg.save_steps % self.cfg.eval_steps == 0
|
||||||
) or False
|
) or False
|
||||||
training_arguments_kwargs["ddp_find_unused_parameters"] = (
|
ddp_find_unused_parameters = (
|
||||||
False if self.cfg.ddp else None
|
self.cfg.ddp_find_unused_parameters
|
||||||
|
if self.cfg.ddp_find_unused_parameters is not None
|
||||||
|
else (False if self.cfg.ddp else None)
|
||||||
)
|
)
|
||||||
|
training_arguments_kwargs[
|
||||||
|
"ddp_find_unused_parameters"
|
||||||
|
] = ddp_find_unused_parameters
|
||||||
training_arguments_kwargs["group_by_length"] = self.cfg.group_by_length
|
training_arguments_kwargs["group_by_length"] = self.cfg.group_by_length
|
||||||
report_to = None
|
report_to = None
|
||||||
if self.cfg.use_wandb:
|
if self.cfg.use_wandb:
|
||||||
|
|||||||
Reference in New Issue
Block a user