Add validation and tests for AdamW hyperparameters

This commit is contained in:
Wing Lian
2023-06-15 09:39:42 -04:00
parent c969f0a9dc
commit cb9d3af5c0
2 changed files with 47 additions and 0 deletions

View File

@@ -87,6 +87,11 @@ def validate_config(cfg):
"You probably want to disable group_by_length as it will force a streamed dataset to download completely."
)
if any([cfg.adamw_beta1, cfg.adamw_beta2, cfg.adamw_epsilon]) and (
not cfg.optimizer or "adamw" not in cfg.optimizer
):
logging.warning("adamw hyperparameters found, but no adamw optimizer set")
# TODO
# MPT 7b
# https://github.com/facebookresearch/bitsandbytes/issues/25