Feat: Rework multimodal support (mllama, llava, pixtral, qwen2, qwen25, gemma3, mistral3) (#2435)

This commit is contained in:
NanoCode012
2025-03-23 22:08:51 +07:00
committed by GitHub
parent 9f00465a5c
commit a9b0733f2c
19 changed files with 971 additions and 184 deletions

View File

@@ -58,7 +58,7 @@ class TestGemma3Text:
"bos_token": "<bos>",
"eos_token": "<eos>",
},
-"chat_template": "gemma3_text",
+"chat_template": "gemma3",
"num_epochs": 1,
"micro_batch_size": 1,
"gradient_accumulation_steps": 4,
@@ -105,7 +105,7 @@ class TestGemma3Text:
"split": "train[:1%]",
},
],
-"chat_template": "gemma3_text",
+"chat_template": "gemma3",
"special_tokens": {
"bos_token": "<bos>",
"eos_token": "<eos>",