add liger kernel support for dpo (#3302)

* add liger kernel for dpo

* revert grpo changes, add support in dpo

* revert grpo changes, add support in dpo

* dpo_use_liger_kernel

* fix liger_dpo

---------

Co-authored-by: Ved <ved.work2024@gmail.com>
This commit is contained in:
VED
2025-12-18 21:41:06 +05:30
committed by GitHub
parent 2197b0bf89
commit 3750d7dd64
2 changed files with 8 additions and 0 deletions

View File

@@ -36,4 +36,6 @@ class DPOStrategy:
training_args_kwargs["dpo_norm_loss"] = cfg.dpo_norm_loss
if cfg.dpo_use_logits_to_keep is not None:
training_args_kwargs["use_logits_to_keep"] = cfg.dpo_use_logits_to_keep
if cfg.dpo_use_liger_kernel is not None:
training_args_kwargs["use_liger_kernel"] = cfg.dpo_use_liger_kernel
return training_args_kwargs

View File

@@ -173,6 +173,12 @@ class AxolotlInputConfig(
dpo_use_logits_to_keep: bool | None = None
dpo_label_smoothing: float | None = None
dpo_norm_loss: bool | None = None
dpo_use_liger_kernel: bool | None = Field(
default=None,
json_schema_extra={"description": "Whether to use Liger kernel for DPO loss."},
)
dpo_padding_free: bool | None = None
dpo_generate_during_eval: bool | None = None