This commit is contained in:
Sunny Liu
2025-04-21 11:28:59 -04:00
parent 320aff1867
commit ffd4ef1ece

View File

@@ -58,8 +58,6 @@ overrides_of_model_kwargs:
# Quantization configuration.
# See: https://huggingface.co/docs/transformers/main/en/quantization/hqq
# https://github.com/mobiusml/hqq
# NOTE(review): confirm `backend` and `bits` are meant to be nested under
# `quantization:`; written at the same column they parse as sibling keys.
quantization:
# Presumably a placeholder listing the alternatives (choose one of the names);
# as written, YAML reads the whole `bnb | hqq | gptq` text as one plain string.
backend: bnb | hqq | gptq
# Quantization bit width (8 here); which widths each backend accepts is not
# shown in this file - TODO confirm against the backend docs.
bits: 8