ignore: address pr review

Maxime authored on 2023-08-26 22:45:45 +02:00 (committed by GitHub)
parent a184549e4c
commit d03887fad5

@@ -368,7 +368,7 @@ def load_model(
     # LlamaRMSNorm layers are in fp32 after kbit_training or full finetune, so we need to
     # convert them back to fp16/bf16 for flash-attn compatibility.
-    if (fix_dtype or cfg.adapter == "" or cfg.adapter is None) and (
+    if (fix_dtype or not cfg.adapter) and (
         cfg.flash_attention and cfg.is_llama_derived_model
     ):
         for name, module in model.named_modules():
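
For context, the review change applied here collapses two explicit checks into a single truthiness test: in Python, both `None` and the empty string `""` are falsy, so `not cfg.adapter` covers both of the old conditions (it is also true for any other falsy value, which is a slight broadening). A minimal sketch of the equivalence, using plain values as a stand-in for `cfg.adapter`:

```python
# Sketch: `not value` is True for None and "" alike, so it subsumes the
# explicit `value == "" or value is None` check the diff removes.
for adapter in (None, "", "lora", "qlora"):
    explicit = adapter == "" or adapter is None
    truthy = not adapter
    assert explicit == truthy, adapter
```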
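
The comment above the condition explains the motivation: k-bit training and full finetunes leave LlamaRMSNorm layers in fp32, while flash-attn expects a uniform fp16/bf16 model. The hunk is truncated before the loop body, but a minimal sketch of what such a cast typically looks like (the helper name and the `"norm"` substring match are assumptions for illustration, not the repository's actual code):

```python
import torch
import torch.nn as nn

def cast_norms(model: nn.Module, dtype: torch.dtype = torch.bfloat16) -> None:
    # Walk every submodule; any norm layer left in fp32 gets cast back so
    # flash-attn does not receive mixed fp32/bf16 activations.
    for name, module in model.named_modules():
        if "norm" in name.lower():  # assumption: norm layers are identifiable by name
            module.to(dtype)
```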