From 641f8012f9e85a6e871495268b1f695c73a494a5 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Sat, 20 May 2023 02:29:31 +0900 Subject: [PATCH] Set `half` using `cfg.fp16` for 4bit --- src/axolotl/utils/models.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/axolotl/utils/models.py b/src/axolotl/utils/models.py index 39845dd9f..45e771deb 100644 --- a/src/axolotl/utils/models.py +++ b/src/axolotl/utils/models.py @@ -112,6 +112,7 @@ def load_model( base_model_config if base_model_config else base_model, model_path, device_map=cfg.device_map, + half=cfg.fp16, groupsize=cfg.gptq_groupsize if cfg.gptq_groupsize else -1, is_v1_model=cfg.gptq_model_v1 if cfg.gptq_model_v1 is not None