bump to latest transformers release

This commit is contained in:
Wing Lian
2025-01-13 10:34:44 -05:00
parent af727eedf7
commit 23389b38b7
3 changed files with 8 additions and 6 deletions

View File

@@ -387,15 +387,13 @@ class ModelLoader:
  self.patch_attention()
  if self.cfg.model_config_type == "llama":
- from axolotl.monkeypatch.trainer_grad_accum import (
+ from axolotl.monkeypatch.trainer_grad_accum import ( # patch_forward_for_ga,; patch_training_step_for_ga,
  patch_flash_attention_forward,
- patch_forward_for_ga,
- patch_training_step_for_ga,
  )
  patch_flash_attention_forward()
- patch_forward_for_ga()
- patch_training_step_for_ga()
+ # patch_forward_for_ga()
+ # patch_training_step_for_ga()
  if self.cfg.sample_packing and self.cfg.s2_attention:
  raise ValueError(