Merge pull request #268 from OpenAccess-AI-Collective/fix-adam-args
The optimizer hyperparameter config keys are adam_* (adam_beta1, adam_beta2, adam_epsilon), not adamw_*
This commit is contained in:
@@ -87,7 +87,7 @@ def validate_config(cfg):
|
||||
"You probably want to disable group_by_length as it will force a streamed dataset to download completely."
|
||||
)
|
||||
|
||||
if any([cfg.adamw_beta1, cfg.adamw_beta2, cfg.adamw_epsilon]) and (
|
||||
if any([cfg.adam_beta1, cfg.adam_beta2, cfg.adam_epsilon]) and (
|
||||
not cfg.optimizer or "adamw" not in cfg.optimizer
|
||||
):
|
||||
logging.warning("adamw hyperparameters found, but no adamw optimizer set")
|
||||
|
||||
@@ -268,7 +268,7 @@ class ValidationTest(unittest.TestCase):
|
||||
cfg = DictDefault(
|
||||
{
|
||||
"optimizer": None,
|
||||
"adamw_epsilon": 0.0001,
|
||||
"adam_epsilon": 0.0001,
|
||||
}
|
||||
)
|
||||
|
||||
@@ -283,7 +283,7 @@ class ValidationTest(unittest.TestCase):
|
||||
cfg = DictDefault(
|
||||
{
|
||||
"optimizer": "adafactor",
|
||||
"adamw_beta1": 0.0001,
|
||||
"adam_beta1": 0.0001,
|
||||
}
|
||||
)
|
||||
|
||||
@@ -298,9 +298,9 @@ class ValidationTest(unittest.TestCase):
|
||||
cfg = DictDefault(
|
||||
{
|
||||
"optimizer": "adamw_bnb_8bit",
|
||||
"adamw_beta1": 0.0001,
|
||||
"adamw_beta2": 0.0001,
|
||||
"adamw_epsilon": 0.0001,
|
||||
"adam_beta1": 0.9,
|
||||
"adam_beta2": 0.99,
|
||||
"adam_epsilon": 0.0001,
|
||||
}
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user