From 3750d7dd64a2c0699d5009392d85de525f7414c6 Mon Sep 17 00:00:00 2001 From: VED <146507396+ved1beta@users.noreply.github.com> Date: Thu, 18 Dec 2025 21:41:06 +0530 Subject: [PATCH] add liger kernel support for dpo (#3302) * add liger kernel for dpo * revert grpo changes, add support in dpo * revert grpo changes, add support in dpo * dpo_use_liger_kernel * fix liger_dpo --------- Co-authored-by: Ved --- src/axolotl/core/trainers/dpo/__init__.py | 2 ++ src/axolotl/utils/schemas/config.py | 6 ++++++ 2 files changed, 8 insertions(+) diff --git a/src/axolotl/core/trainers/dpo/__init__.py b/src/axolotl/core/trainers/dpo/__init__.py index 3aa79c484..5e160e692 100644 --- a/src/axolotl/core/trainers/dpo/__init__.py +++ b/src/axolotl/core/trainers/dpo/__init__.py @@ -36,4 +36,6 @@ class DPOStrategy: training_args_kwargs["dpo_norm_loss"] = cfg.dpo_norm_loss if cfg.dpo_use_logits_to_keep is not None: training_args_kwargs["use_logits_to_keep"] = cfg.dpo_use_logits_to_keep + if cfg.dpo_use_liger_kernel is not None: + training_args_kwargs["use_liger_kernel"] = cfg.dpo_use_liger_kernel return training_args_kwargs diff --git a/src/axolotl/utils/schemas/config.py b/src/axolotl/utils/schemas/config.py index c9b087ea3..bd6a61177 100644 --- a/src/axolotl/utils/schemas/config.py +++ b/src/axolotl/utils/schemas/config.py @@ -173,6 +173,12 @@ class AxolotlInputConfig( dpo_use_logits_to_keep: bool | None = None dpo_label_smoothing: float | None = None dpo_norm_loss: bool | None = None + + dpo_use_liger_kernel: bool | None = Field( + default=None, + json_schema_extra={"description": "Whether to use Liger kernel for DPO loss."}, + ) + dpo_padding_free: bool | None = None dpo_generate_during_eval: bool | None = None