workaround so training doesn't hang when packed dataloader batches aren't even (#461)

* workaround so training doesn't hang when packed dataloader batches aren't even * don't bother labeling anything in the no-op data
2023-08-23 10:39:11 -04:00
parent d5dcf9c350
commit c69faee7a7
1 changed files with 12 additions and 0 deletions
--- a/src/axolotl/utils/dataloader.py
+++ b/src/axolotl/utils/dataloader.py
@@ -243,6 +243,18 @@ class MultipackDistributedDataloader:
            len_remaining -= 1
            if not len_remaining:
                return
        # yield a no-op for cases where we don't have any data left to pack
        for i in range(0, len_remaining):
            yield self.collate_fn(
                [
                    {
                        "input_ids": [0],
                        "labels": [-100],
                        "attention_mask": [True],
                        "position_ids": [0],
                    }
                ]
            )
    def _len_est(self):
        lengths_sum = np.sum(self.lengths)