passthrough dataset parser for dpo/grpo

This commit is contained in:
Wing Lian
2025-02-02 23:36:22 -05:00
parent 59ad21f2de
commit 54b0d3d0e8
2 changed files with 16 additions and 0 deletions

View File

@@ -10,3 +10,5 @@ class AxolotlGRPOTrainer(SchedulerMixin, GRPOTrainer):
"""
Extend the base GRPOTrainer for axolotl helpers
"""
_tag_names = ["trl", "grpo", "axolotl"]

View File

@@ -0,0 +1,14 @@
"""
Passthrough (zero-processing) DPO prompt strategy: each sample is returned unchanged.
"""
def default(
    cfg, dataset_idx=0, **kwargs
):  # pylint: disable=possibly-unused-variable,unused-argument
    """
    Build a passthrough transform that leaves dataset samples untouched.

    Args:
        cfg: Configuration object. Accepted but not read by this strategy.
        dataset_idx: Dataset index. Accepted but not read by this strategy.
        **kwargs: Any extra keyword arguments; ignored.

    Returns:
        A callable ``transform_fn(sample, tokenizer=None)`` that returns the
        very same ``sample`` object it was given (no copy, no modification).
    """

    def transform_fn(
        sample, tokenizer=None
    ):  # pylint: disable=possibly-unused-variable,unused-argument
        """Return ``sample`` as-is; ``tokenizer`` is accepted but unused."""
        return sample

    return transform_fn