support for QAT w RL (DPO) (#2776)

This commit is contained in:
Wing Lian
2025-06-13 10:00:35 -04:00
committed by GitHub
parent eac4a61f55
commit b2274d430b
9 changed files with 152 additions and 32 deletions

View File

@@ -5,6 +5,10 @@ tokenizer_type: AutoTokenizer
# Automatically upload checkpoint and final model to HF
# hub_model_id: username/custom_model_name
special_tokens:
  pad_token: <|finetune_right_pad_id|>
  eos_token: <|eot_id|>
load_in_8bit: true
load_in_4bit: false