diff --git a/examples/pixtral/lora-12b.yml b/examples/pixtral/lora-12b.yml index 88fb02be5..8e8373d59 100644 --- a/examples/pixtral/lora-12b.yml +++ b/examples/pixtral/lora-12b.yml @@ -50,7 +50,7 @@ tf32: true gradient_checkpointing: true local_rank: logging_steps: 1 -flash_attention: true +flash_attention: false eager_attention: warmup_ratio: 0.1