diff --git a/examples/yayi2-30b/qlora.yml b/examples/yayi2-30b/qlora.yml index a6500104e..3d4cd0a50 100644 --- a/examples/yayi2-30b/qlora.yml +++ b/examples/yayi2-30b/qlora.yml @@ -3,7 +3,7 @@ model_type: AutoModelForCausalLM tokenizer_type: AutoTokenizer is_mistral_derived_model: false trust_remote_code: true -model_revision: refs/pr/5 + load_in_8bit: false load_in_4bit: true @@ -43,8 +43,8 @@ wandb_watch: wandb_name: wandb_log_model: -gradient_accumulation_steps: 4 -micro_batch_size: 2 +gradient_accumulation_steps: 1 +micro_batch_size: 1 num_epochs: 1 optimizer: adamw_bnb_8bit lr_scheduler: cosine