Add 'reward_processing_classes' to the GRPO trainer kwargs
This commit is contained in:
@@ -53,6 +53,10 @@ class GRPOStrategy:
|
||||
for reward_func_fqn in cfg.grpo_reward_funcs:
|
||||
reward_funcs.append(cls.get_reward_func(reward_func_fqn))
|
||||
trainer_kwargs["reward_funcs"] = reward_funcs
|
||||
if cfg.grpo_reward_processing_classes:
|
||||
trainer_kwargs[
|
||||
"reward_processing_classes"
|
||||
] = cfg.grpo_reward_processing_classes
|
||||
return trainer_kwargs
|
||||
|
||||
@classmethod
|
||||
|
||||
Reference in New Issue
Block a user