adding 'reward_processing_classes'
This commit is contained in:
@@ -53,6 +53,10 @@ class GRPOStrategy:
             for reward_func_fqn in cfg.grpo_reward_funcs:
                 reward_funcs.append(cls.get_reward_func(reward_func_fqn))
             trainer_kwargs["reward_funcs"] = reward_funcs
+        if cfg.grpo_reward_processing_classes:
+            trainer_kwargs[
+                "reward_processing_classes"
+            ] = cfg.grpo_reward_processing_classes
         return trainer_kwargs
 
     @classmethod
Reference in New Issue
Block a user