new lr, sample pack

This commit is contained in:
mhenrichsen
2023-10-06 22:58:13 +02:00
parent 669f1d052c
commit 4c8ddf2c6f

View File

@@ -16,8 +16,8 @@ val_set_size: 0.01
output_dir: ./out
sequence_len: 8192
-sample_packing:
-pad_to_sequence_len:
+sample_packing: true
+pad_to_sequence_len: true
wandb_project:
wandb_entity:
@@ -30,7 +30,7 @@ micro_batch_size: 2
num_epochs: 3
optimizer: adamw_bnb_8bit
lr_scheduler: cosine
-learning_rate: 0.0002
+learning_rate: 0.000005
train_on_inputs: false
group_by_length: false
@@ -59,4 +59,4 @@ fsdp_config:
special_tokens:
bos_token: "<s>"
eos_token: "</s>"
-unk_token: "<unk>"
+unk_token: "<unk>"