migrate example configs to canonical attn_implementation
This commit is contained in:
@@ -35,7 +35,7 @@ warmup_ratio: 0.1
|
||||
optimizer: adamw_8bit
|
||||
lr_scheduler: cosine
|
||||
learning_rate: 3e-4
|
||||
-sdp_attention: true
|
||||
+attn_implementation: sdpa
|
||||
|
||||
bf16: auto
|
||||
tf32: true
|
||||
|
||||
@@ -41,7 +41,7 @@ tf32: true
|
||||
|
||||
gradient_checkpointing: true
|
||||
resume_from_checkpoint:
|
||||
-sdp_attention: true
|
||||
+attn_implementation: sdpa
|
||||
|
||||
logging_steps: 1
|
||||
save_strategy: best
|
||||
|
||||
Reference in New Issue
Block a user