don't check dataset labels during preprocess for GRPO (#2952) [skip ci]
* don't check dataset labels during preprocess for GRPO
* use enum check per PR feedback
This commit is contained in:
@@ -122,7 +122,7 @@ def load_preference_datasets(
|
||||
math.ceil(len(train_dataset) * cfg.num_epochs / cfg.batch_size)
|
||||
)
|
||||
|
||||
if (cli_args and cli_args.debug) or cfg.debug:
|
||||
if ((cli_args and cli_args.debug) or cfg.debug) and cfg.rl != RLType.GRPO:
|
||||
LOG.info("check_dataset_labels...")
|
||||
|
||||
num_examples = cli_args.debug_num_examples if cli_args else 1
|
||||
|
||||
Reference in New Issue
Block a user