From c969f0a9dc28c9f095a2bb6b3ecede0216d909b5 Mon Sep 17 00:00:00 2001
From: Wing Lian
Date: Thu, 15 Jun 2023 08:43:20 -0400
Subject: [PATCH] add docs

---
 README.md | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/README.md b/README.md
index d6c9cfefb..5fbac1a48 100644
--- a/README.md
+++ b/README.md
@@ -422,6 +422,12 @@ log_sweep_max_lr:
 optimizer:
 # specify weight decay
 weight_decay:
+# adamw hyperparams
+adam_beta1:
+adam_beta2:
+adam_epsilon:
+# Gradient clipping max norm
+max_grad_norm:

 # whether to bettertransformers
 flash_optimum: