passthrough dataset parser for dpo/grpo
This commit is contained in:
@@ -10,3 +10,5 @@ class AxolotlGRPOTrainer(SchedulerMixin, GRPOTrainer):
|
|||||||
"""
|
"""
|
||||||
Extend the base GRPOTrainer for axolotl helpers
|
Extend the base GRPOTrainer for axolotl helpers
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
_tag_names = ["trl", "grpo", "axolotl"]
|
||||||
|
|||||||
14
src/axolotl/prompt_strategies/dpo/passthrough.py
Normal file
14
src/axolotl/prompt_strategies/dpo/passthrough.py
Normal file
@@ -0,0 +1,14 @@
|
|||||||
|
"""
|
||||||
|
Passthrough (zero-processing) prompt strategy for DPO datasets
|
||||||
|
"""
|
||||||
|
|
||||||
|
|
||||||
|
def default(
    cfg, dataset_idx=0, **kwargs
):  # pylint: disable=possibly-unused-variable,unused-argument
    """Build a transform function that returns each sample unchanged.

    None of the arguments are read by this strategy; they are accepted
    (and silenced for pylint) only so the factory can be called with them.

    Args:
        cfg: Unused.
        dataset_idx: Unused. Defaults to 0.
        **kwargs: Unused.

    Returns:
        A callable ``transform_fn(sample, tokenizer=None)`` that returns
        ``sample`` as-is.
    """

    def transform_fn(
        sample, tokenizer=None
    ):  # pylint: disable=possibly-unused-variable,unused-argument
        """Return ``sample`` untouched; ``tokenizer`` is ignored."""
        # Zero processing: the very same object is handed back, not a copy.
        return sample

    return transform_fn
|
||||||
Reference in New Issue
Block a user