From 71bd06243c91b23182debedc2675c2eab69adcaf Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Fri, 25 Aug 2023 14:30:50 +0900 Subject: [PATCH] Fix(tokenizer): Fix condition to add pad token (#477) * Fix(tokenizer): Fix condition to add pad token * chore: fix lint --- src/axolotl/utils/models.py | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/src/axolotl/utils/models.py b/src/axolotl/utils/models.py index 4fad740c5..64c80109e 100644 --- a/src/axolotl/utils/models.py +++ b/src/axolotl/utils/models.py @@ -55,10 +55,15 @@ def load_tokenizer(cfg): **tokenizer_kwargs, ) - if tokenizer.__class__.__name__ in [ - "LlamaTokenizer", - "LlamaTokenizerFast", - ] and not hasattr(tokenizer, "pad_token"): + if ( + tokenizer.__class__.__name__ + in [ + "LlamaTokenizer", + "LlamaTokenizerFast", + ] + and hasattr(tokenizer, "pad_token") + and not tokenizer.pad_token + ): # set a pad_token, but use eos_token so we don't add a new token tokenizer.pad_token = LLAMA_DEFAULT_EOS_TOKEN