Merge pull request #37 from Thytu/main

fix: handle AutoTokenizer from untrusted source
This commit is contained in:
Wing Lian
2023-05-24 15:42:41 -04:00
committed by GitHub

View File

@@ -167,7 +167,7 @@ def load_model(
else:
tokenizer = getattr(transformers, tokenizer_type).from_pretrained(model)
except:
- tokenizer = AutoTokenizer.from_pretrained(base_model_config)
+ tokenizer = AutoTokenizer.from_pretrained(base_model_config, trust_remote_code=True if cfg.trust_remote_code is True else False)
logging.debug(f"EOS: {tokenizer.eos_token_id} / {tokenizer.eos_token}")
logging.debug(f"BOS: {tokenizer.bos_token_id} / {tokenizer.bos_token}")