migrate example configs to canonical attn_implementation
This commit is contained in:
@@ -58,7 +58,7 @@ gradient_checkpointing: true
|
||||
resume_from_checkpoint:
|
||||
logging_steps: 1
|
||||
# flash_attention: true # Not supported
|
||||
-sdp_attention: true
|
||||
+attn_implementation: sdpa
|
||||
|
||||
warmup_ratio: 0.1
|
||||
evals_per_epoch: 1
|
||||
|
||||
Reference in New Issue
Block a user