new lr, sample pack

This commit is contained in:
mhenrichsen
2023-10-06 22:58:13 +02:00
parent 669f1d052c
commit 4c8ddf2c6f

View File

@@ -16,8 +16,8 @@ val_set_size: 0.01
output_dir: ./out
sequence_len: 8192
-sample_packing:
-pad_to_sequence_len:
+sample_packing: true
+pad_to_sequence_len: true
wandb_project:
wandb_entity:
@@ -30,7 +30,7 @@ micro_batch_size: 2
num_epochs: 3
optimizer: adamw_bnb_8bit
lr_scheduler: cosine
-learning_rate: 0.0002
+learning_rate: 0.000005
train_on_inputs: false
group_by_length: false