From d0c4930dd54685d15643617b23033c6f900f854f Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Wed, 7 May 2025 16:55:01 +0700 Subject: [PATCH] fix: set replit mpt model to use eager attention --- examples/replit-3b/config-lora.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/replit-3b/config-lora.yml b/examples/replit-3b/config-lora.yml index 7ffa0bf98..6cccc4e1e 100644 --- a/examples/replit-3b/config-lora.yml +++ b/examples/replit-3b/config-lora.yml @@ -38,7 +38,7 @@ tf32: true gradient_checkpointing: resume_from_checkpoint: logging_steps: 1 -attention: flash +attention: eager gptq_groupsize: gptq_model_v1: warmup_steps: 20