Lower learning rate to 0.000005; enable sample packing and pad_to_sequence_len

This commit is contained in:
mhenrichsen
2023-10-06 22:58:13 +02:00
parent 669f1d052c
commit 4c8ddf2c6f

View File

@@ -16,8 +16,8 @@ val_set_size: 0.01
output_dir: ./out output_dir: ./out
sequence_len: 8192 sequence_len: 8192
sample_packing: sample_packing: true
pad_to_sequence_len: pad_to_sequence_len: true
wandb_project: wandb_project:
wandb_entity: wandb_entity:
@@ -30,7 +30,7 @@ micro_batch_size: 2
num_epochs: 3 num_epochs: 3
optimizer: adamw_bnb_8bit optimizer: adamw_bnb_8bit
lr_scheduler: cosine lr_scheduler: cosine
learning_rate: 0.0002 learning_rate: 0.000005
train_on_inputs: false train_on_inputs: false
group_by_length: false group_by_length: false