From a4329b10680e39003de533d1ba3f7c80734e1a01 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Sun, 7 May 2023 18:30:48 -0400 Subject: [PATCH] fix #16 load best model setting when using 8bit --- src/axolotl/utils/trainer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/axolotl/utils/trainer.py b/src/axolotl/utils/trainer.py index 5569a38ae..6535c2a7e 100644 --- a/src/axolotl/utils/trainer.py +++ b/src/axolotl/utils/trainer.py @@ -97,7 +97,7 @@ def setup_trainer(cfg, train_dataset, eval_dataset, model, tokenizer): output_dir=cfg.output_dir, save_total_limit=3, load_best_model_at_end=True - if cfg.val_set_size > 0 and save_steps % eval_steps == 0 + if cfg.val_set_size > 0 and save_steps % eval_steps == 0 and cfg.load_in_8bit is not True else False, ddp_find_unused_parameters=False if cfg.ddp else None, group_by_length=cfg.group_by_length,