use smaller pretrained models for ci (#3620) [skip ci]

* use smaller pretrained models for ci
* more steps for loss check
* fix tests
* more train steps
* fix losses
2026-04-27 13:22:56 -04:00
parent 798c8fba89
commit ac77da96da
24 changed files with 716 additions and 288 deletions
--- a/tests/e2e/kernels/test_lora_features.py
+++ b/tests/e2e/kernels/test_lora_features.py
@@ -24,7 +24,7 @@ from axolotl.monkeypatch.lora_kernels import (
 )
 from axolotl.utils.dict import DictDefault

-MODEL_NAME = "Qwen/Qwen3-0.6B"
+MODEL_NAME = "axolotl-ai-co/tiny-qwen3-129m"
 DEVICE = "cuda"
 DTYPE = torch.bfloat16