From 24907533d11102c2f10b9562feba2eca61b8e80a Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Wed, 30 Apr 2025 11:06:50 -0400 Subject: [PATCH] don't automatically enable lora kernels for RL training (#2600) --- src/axolotl/utils/schemas/config.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/axolotl/utils/schemas/config.py b/src/axolotl/utils/schemas/config.py index bc25b1ab0..7f35de81d 100644 --- a/src/axolotl/utils/schemas/config.py +++ b/src/axolotl/utils/schemas/config.py @@ -1319,6 +1319,9 @@ class AxolotlConfigWCapabilities(AxolotlInputConfig): @classmethod def check_auto_enable_lora_kernels(cls, data): # Only proceed if using LoRA or QLoRA adapter + if data.get("rl"): + # RL trainers not tested so don't enable kernels by default + return data if data.get("adapter") in ["lora", "qlora"]: # Skip if already set, using unsloth optimizations, or using 8-bit unsloth_fields = ["unsloth_lora_mlp", "unsloth_lora_qkv", "unsloth_lora_o"]