diff --git a/src/axolotl/utils/models.py b/src/axolotl/utils/models.py index 4fad740c5..64c80109e 100644 --- a/src/axolotl/utils/models.py +++ b/src/axolotl/utils/models.py @@ -55,10 +55,15 @@ def load_tokenizer(cfg): **tokenizer_kwargs, ) - if tokenizer.__class__.__name__ in [ - "LlamaTokenizer", - "LlamaTokenizerFast", - ] and not hasattr(tokenizer, "pad_token"): + if ( + tokenizer.__class__.__name__ + in [ + "LlamaTokenizer", + "LlamaTokenizerFast", + ] + and hasattr(tokenizer, "pad_token") + and not tokenizer.pad_token + ): # set a pad_token, but use eos_token so we don't add a new token tokenizer.pad_token = LLAMA_DEFAULT_EOS_TOKEN