add doc + requirement for hqq

This commit is contained in:
Sunny Liu
2025-04-18 00:26:35 -04:00
committed by Sung Ching Liu
parent 0c40d12a18
commit 0e9b060b4d
3 changed files with 21 additions and 2 deletions

View File

@@ -63,6 +63,24 @@ bnb_config_kwargs:
bnb_4bit_quant_type: nf4
bnb_4bit_use_double_quant: true
# Override the quantization method to use HQQ instead of the default bitsandbytes (bnb).
# See: https://huggingface.co/docs/transformers/main/en/quantization/hqq
# https://github.com/mobiusml/hqq
use_hqq: true
hqq_config:
- nbits: 4
group_size: 64
target_modules:
- self_attn.k_proj
- self_attn.v_proj
- self_attn.o_proj
- nbits: 3
group_size: 32
target_modules:
- mlp.gate_proj
- mlp.up_proj
- mlp.down_proj
# Whether you are training a 4-bit GPTQ quantized model
gptq: true

View File

@@ -22,6 +22,7 @@ hf_xet==1.0.0
optimum==1.16.2
hf_transfer
hqq
sentencepiece
gradio==5.23.3

View File

@@ -44,7 +44,7 @@ from axolotl.utils.schemas.model import (
)
from axolotl.utils.schemas.multimodal import MultiModalConfig
from axolotl.utils.schemas.peft import LoraConfig, ReLoRAConfig
from axolotl.utils.schemas.quant import HQQConfig
from axolotl.utils.schemas.quant import QuantizationConfig
from axolotl.utils.schemas.training import HyperparametersConfig
from axolotl.utils.schemas.trl import TRLConfig
from axolotl.utils.schemas.vllm import VllmConfig
@@ -60,7 +60,7 @@ class AxolotlInputConfig(
ModelOutputConfig,
LoraConfig,
ReLoRAConfig,
HQQConfig,
QuantizationConfig,
HyperparametersConfig,
WandbConfig,
MLFlowConfig,