Merge pull request #32 from NanoCode012/patch-2

Feat: Set `half` using `cfg.fp16` for 4bit
This commit is contained in:
Wing Lian
2023-05-20 18:21:02 -04:00
committed by GitHub

View File

@@ -112,6 +112,7 @@ def load_model(
base_model_config if base_model_config else base_model,
model_path,
device_map=cfg.device_map,
half=cfg.fp16,
groupsize=cfg.gptq_groupsize if cfg.gptq_groupsize else -1,
is_v1_model=cfg.gptq_model_v1
if cfg.gptq_model_v1 is not None