pr comments addressed
This commit is contained in:
@@ -13,7 +13,7 @@ dataset_prepared_path: last_run_prepared
|
|||||||
val_set_size: 0.02
|
val_set_size: 0.02
|
||||||
adapter: lora
|
adapter: lora
|
||||||
lora_model_dir:
|
lora_model_dir:
|
||||||
sequence_len: 512
|
sequence_len: 256
|
||||||
max_packed_sequence_len:
|
max_packed_sequence_len:
|
||||||
lora_r: 8
|
lora_r: 8
|
||||||
lora_alpha: 16
|
lora_alpha: 16
|
||||||
@@ -43,7 +43,7 @@ train_on_inputs: false
|
|||||||
group_by_length: false
|
group_by_length: false
|
||||||
bf16: false
|
bf16: false
|
||||||
fp16: true
|
fp16: true
|
||||||
tf32: true
|
tf32: false
|
||||||
gradient_checkpointing: true
|
gradient_checkpointing: true
|
||||||
early_stopping_patience:
|
early_stopping_patience:
|
||||||
resume_from_checkpoint:
|
resume_from_checkpoint:
|
||||||
|
|||||||
Reference in New Issue
Block a user