drop position_ids for olmo model
This commit is contained in:
@@ -197,6 +197,12 @@ def process_datasets_for_packing(cfg, train_dataset, eval_dataset):
|
||||
if eval_dataset:
|
||||
eval_dataset = eval_dataset.remove_columns("attention_mask")
|
||||
|
||||
if cfg.model_config_type == "olmo":
|
||||
LOG.info("dropping position_ids column")
|
||||
train_dataset = train_dataset.remove_columns("position_ids")
|
||||
if eval_dataset:
|
||||
eval_dataset = eval_dataset.remove_columns("position_ids")
|
||||
|
||||
if cfg.model_config_type == "falcon":
|
||||
LOG.info("dropping token_type_ids column if it exists")
|
||||
if "token_type_ids" in train_dataset.column_names:
|
||||
|
||||
Reference in New Issue
Block a user