add doc + requirement for hqq

This commit is contained in:
Sunny Liu
2025-04-18 00:26:35 -04:00
committed by Sung Ching Liu
parent 0c40d12a18
commit 0e9b060b4d
3 changed files with 21 additions and 2 deletions

View File

@@ -63,6 +63,24 @@ bnb_config_kwargs:
bnb_4bit_quant_type: nf4 bnb_4bit_quant_type: nf4
bnb_4bit_use_double_quant: true bnb_4bit_use_double_quant: true
# Overrides the quantization method to use HQQ instead of the default bnb (bitsandbytes).
# See: https://huggingface.co/docs/transformers/main/en/quantization/hqq
# https://github.com/mobiusml/hqq
use_hqq: true
hqq_config:
  - nbits: 4
    group_size: 64
    target_modules:
      - self_attn.k_proj
      - self_attn.v_proj
      - self_attn.o_proj
  - nbits: 3
    group_size: 32
    target_modules:
      - mlp.gate_proj
      - mlp.up_proj
      - mlp.down_proj
# Whether you are training a 4-bit GPTQ quantized model # Whether you are training a 4-bit GPTQ quantized model
gptq: true gptq: true

View File

@@ -22,6 +22,7 @@ hf_xet==1.0.0
optimum==1.16.2 optimum==1.16.2
hf_transfer hf_transfer
hqq
sentencepiece sentencepiece
gradio==5.23.3 gradio==5.23.3

View File

@@ -44,7 +44,7 @@ from axolotl.utils.schemas.model import (
) )
from axolotl.utils.schemas.multimodal import MultiModalConfig from axolotl.utils.schemas.multimodal import MultiModalConfig
from axolotl.utils.schemas.peft import LoraConfig, ReLoRAConfig from axolotl.utils.schemas.peft import LoraConfig, ReLoRAConfig
from axolotl.utils.schemas.quant import HQQConfig from axolotl.utils.schemas.quant import QuantizationConfig
from axolotl.utils.schemas.training import HyperparametersConfig from axolotl.utils.schemas.training import HyperparametersConfig
from axolotl.utils.schemas.trl import TRLConfig from axolotl.utils.schemas.trl import TRLConfig
from axolotl.utils.schemas.vllm import VllmConfig from axolotl.utils.schemas.vllm import VllmConfig
@@ -60,7 +60,7 @@ class AxolotlInputConfig(
ModelOutputConfig, ModelOutputConfig,
LoraConfig, LoraConfig,
ReLoRAConfig, ReLoRAConfig,
HQQConfig, QuantizationConfig,
HyperparametersConfig, HyperparametersConfig,
WandbConfig, WandbConfig,
MLFlowConfig, MLFlowConfig,