Make the `train_on_eos` default "turn" (previously "last") so all EOS tokens are treated the same (#1847) [skip ci]

This commit is contained in:
Wing Lian
2024-08-22 11:45:37 -04:00
committed by GitHub
parent 5b0b774e38
commit 9caa3eb699

View File

@@ -357,7 +357,7 @@ def load(tokenizer, cfg, ds_cfg: Optional[Dict[str, Any]] = None):
"train_on_inputs": cfg.train_on_inputs,
"sequence_len": cfg.sequence_len,
"roles_to_train": ds_cfg.get("roles_to_train", ["gpt", "assistant"]),
"train_on_eos": ds_cfg.get("train_on_eos", "last"),
"train_on_eos": ds_cfg.get("train_on_eos", "turn"),
}
strategy = ChatTemplateStrategy(