small batch size

This commit is contained in:
Mads Henrichsen
2023-12-30 13:20:45 +01:00
parent 97943d8fc4
commit e3716db386

View File

@@ -3,7 +3,7 @@ model_type: AutoModelForCausalLM
tokenizer_type: AutoTokenizer
is_mistral_derived_model: false
trust_remote_code: true
model_revision: refs/pr/5
load_in_8bit: false
load_in_4bit: true
@@ -43,8 +43,8 @@ wandb_watch:
wandb_name:
wandb_log_model:
-gradient_accumulation_steps: 4
-micro_batch_size: 2
+gradient_accumulation_steps: 1
+micro_batch_size: 1
num_epochs: 1
optimizer: adamw_bnb_8bit
lr_scheduler: cosine