From 380921ee5633b07a8a3451705efd432f02d9e06f Mon Sep 17 00:00:00 2001 From: mhenrhcsen Date: Thu, 17 Jul 2025 19:53:41 +0200 Subject: [PATCH] Update ModelLoader to set a default vocab_size of 50257 (with a warning) when the model config does not define one, enhancing compatibility with tokenizer defaults. --- src/axolotl/loaders/model.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/axolotl/loaders/model.py b/src/axolotl/loaders/model.py index 63bdc7004..c4621a30c 100644 --- a/src/axolotl/loaders/model.py +++ b/src/axolotl/loaders/model.py @@ -762,6 +762,10 @@ class ModelLoader: ) else: + if not hasattr(self.model_config, 'vocab_size'): + LOG.warning("Model config does not have vocab_size attribute, setting to 50257") + self.model_config.vocab_size = 50257 + self.model = getattr(transformers, self.model_type).from_pretrained( self.base_model, config=self.model_config,