This commit is contained in:
Wing Lian
2023-06-15 08:43:20 -04:00
parent 6d0ee4ba34
commit c969f0a9dc

View File

@@ -422,6 +422,12 @@ log_sweep_max_lr:
optimizer:
# specify weight decay
weight_decay:
# adamw hyperparams
adam_beta1:
adam_beta2:
adam_epsilon:
# Gradient clipping max norm
max_grad_norm:
# whether to use bettertransformers
flash_optimum: