diff --git a/src/axolotl/utils/models.py b/src/axolotl/utils/models.py index 6cd1cd7ea..063e43977 100644 --- a/src/axolotl/utils/models.py +++ b/src/axolotl/utils/models.py @@ -356,7 +356,7 @@ def load_model( if hasattr(module, "weight"): module.to(torch.float32) - needs_fa2_dtype = cfg.adapter is not None + needs_fa2_dtype = cfg.adapter or cfg.fsdp if not cfg.gptq and ( (cfg.adapter == "lora" and load_in_8bit) or (cfg.adapter == "qlora" and cfg.load_in_4bit)