From 38adf5cd37f4d99b0d488892d96d85ff81f4f2e1 Mon Sep 17 00:00:00 2001 From: tocmo0nlord Date: Wed, 13 May 2026 13:32:46 +0000 Subject: [PATCH] add trust_remote_code, explicit bfloat16 and bnb dtype settings --- human_chat_qlora.yml | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/human_chat_qlora.yml b/human_chat_qlora.yml index 0ff381e14..ba5f68a52 100644 --- a/human_chat_qlora.yml +++ b/human_chat_qlora.yml @@ -18,6 +18,13 @@ tokenizer_type: AutoTokenizer load_in_4bit: true strict: false +trust_remote_code: true + +# Explicit dtype settings to avoid weight conversion errors +torch_dtype: bfloat16 +bnb_4bit_use_double_quant: true +bnb_4bit_quant_type: nf4 +bnb_4bit_compute_dtype: bfloat16 # --- System prompt baked into every conversation --- # This is the primary lever for "no error correcting, more human-like"