diff --git a/examples/lora-openllama-3b/config.yml b/examples/lora-openllama-3b/config.yml index 393942d96..6665044e0 100644 --- a/examples/lora-openllama-3b/config.yml +++ b/examples/lora-openllama-3b/config.yml @@ -13,7 +13,7 @@ dataset_prepared_path: last_run_prepared val_set_size: 0.02 adapter: lora lora_model_dir: -sequence_len: 512 +sequence_len: 256 max_packed_sequence_len: lora_r: 8 lora_alpha: 16 @@ -43,7 +43,7 @@ train_on_inputs: false group_by_length: false bf16: false fp16: true -tf32: true +tf32: false gradient_checkpointing: true early_stopping_patience: resume_from_checkpoint: