Replace references to the random 68M model with the 135M SmolLM2 (#2570) [skip ci]

* replace references to the random 68M model with the 135M SmolLM2

* use AutoTokenizer for smollm2
This commit is contained in:
Wing Lian
2025-04-28 10:08:07 -04:00
committed by GitHub
parent f1df73a798
commit 40f4ea23ab
13 changed files with 95 additions and 87 deletions

View File

@@ -18,9 +18,9 @@ class TestModelsUtils:
# load config
self.cfg = DictDefault( # pylint: disable=attribute-defined-outside-init
{
-"base_model": "JackFram/llama-68m",
-"model_type": "LlamaForCausalLM",
-"tokenizer_type": "LlamaTokenizer",
+"base_model": "HuggingFaceTB/SmolLM2-135M",
+"model_type": "AutoModelForCausalLM",
+"tokenizer_type": "AutoTokenizer",
"load_in_8bit": True,
"load_in_4bit": False,
"adapter": "lora",
@@ -65,7 +65,7 @@ class TestModelsUtils:
"s2_attention": True,
"sample_packing": True,
"base_model": "",
-"model_type": "LlamaForCausalLM",
+"model_type": "AutoModelForCausalLM",
}
)