optimize dataloading to use cache, fix model token embedding sizes
This commit is contained in:
@@ -181,6 +181,8 @@ def load_model(
|
||||
for k, v in cfg.tokens.items():
|
||||
tokenizer.add_special_tokens({k: v})
|
||||
|
||||
model.resize_token_embeddings(len(tokenizer))
|
||||
|
||||
if cfg.adapter and load_in_8bit and not cfg.load_4bit:
|
||||
logging.info("converting PEFT model w/ prepare_model_for_int8_training")
|
||||
model = prepare_model_for_int8_training(model)
|
||||
|
||||
Reference in New Issue
Block a user