Compare commits

...

2 Commits

Author SHA1 Message Date
Wing Lian
bb65157dcf fix conditional for None values 2025-08-17 12:49:48 -04:00
Wing Lian
7fd3d8abc4 handle batch size correctly when using split and dispatch batches 2025-08-16 22:05:31 -04:00
3 changed files with 15 additions and 1 deletion

View File

@@ -424,7 +424,7 @@ class HFCausalTrainerBuilder(TrainerBuilderBase):
):
if training_args.pretraining:
if (
- self.cfg.pretraining_sample_concatenation is False
+ not self.cfg.pretraining_sample_concatenation
or self.cfg.micro_batch_size > 1
):
return DataCollatorForSeq2Seq(self.tokenizer, **kwargs)

View File

@@ -272,6 +272,20 @@ class AxolotlTrainer(
num_workers=self.args.dataloader_num_workers,
rank=self.args.process_index,
)
if (
self.args.accelerator_config is not None
and self.args.accelerator_config.split_batches
and self.args.accelerator_config.dispatch_batches
):
if self.args.sample_packing and self.args.pretraining:
if not self.args.eval_sample_packing and not is_training:
dataloader_params["batch_size"] *= self.accelerator.num_processes
else:
dataloader_params["batch_size"] = self.accelerator.num_processes
elif not self.args.sample_packing and self.args.pretraining:
dataloader_params["batch_size"] *= self.accelerator.num_processes
if self.args.sample_packing and (
(is_training and not self.args.pretraining)
or (not is_training and self.args.eval_sample_packing is not False)

View File