apply chat template as arg

This commit is contained in:
Wing Lian
2025-01-12 17:38:32 -05:00
parent 530bf77cf9
commit fd91de3ea6

View File

@@ -22,6 +22,8 @@ def build_lm_eval_command(
wandb_entity=None, wandb_entity=None,
model=None, model=None,
revision=None, revision=None,
apply_chat_template=None,
fewshot_as_multiturn=None,
): ):
tasks_by_num_fewshot: dict[str, list] = defaultdict(list) tasks_by_num_fewshot: dict[str, list] = defaultdict(list)
for task in tasks: for task in tasks:
@@ -55,7 +57,6 @@ def build_lm_eval_command(
str(batch_size), str(batch_size),
"--output_path", "--output_path",
output_path, output_path,
"--apply_chat_template",
] ]
wandb_args = [] wandb_args = []
if wandb_project: if wandb_project:
@@ -65,10 +66,13 @@ def build_lm_eval_command(
if wandb_args: if wandb_args:
lm_eval_args.append("--wandb_args") lm_eval_args.append("--wandb_args")
lm_eval_args.append(",".join(wandb_args)) lm_eval_args.append(",".join(wandb_args))
if apply_chat_template:
lm_eval_args.append("--apply_chat_template")
if num_fewshot_val: if num_fewshot_val:
lm_eval_args.append("--num_fewshot") lm_eval_args.append("--num_fewshot")
lm_eval_args.append(str(num_fewshot_val)) lm_eval_args.append(str(num_fewshot_val))
# lm_eval_args.append("--fewshot_as_multiturn") if apply_chat_template and fewshot_as_multiturn:
lm_eval_args.append("--fewshot_as_multiturn")
yield lm_eval_args yield lm_eval_args
@@ -100,6 +104,8 @@ def lm_eval(config: str, cloud: Optional[str] = None):
wandb_entity=cfg.wandb_entity, wandb_entity=cfg.wandb_entity,
model=cfg.lm_eval_model or cfg.hub_model_id, model=cfg.lm_eval_model or cfg.hub_model_id,
revision=cfg.revision, revision=cfg.revision,
apply_chat_template=cfg.apply_chat_template,
fewshot_as_multiturn=cfg.fewshot_as_multiturn,
): ):
subprocess.run( # nosec subprocess.run( # nosec
lm_eval_args, lm_eval_args,