diff --git a/.nojekyll b/.nojekyll index 7dc9a4cc9..3366cdb39 100644 --- a/.nojekyll +++ b/.nojekyll @@ -1 +1 @@ -51905dfe \ No newline at end of file +e1e28bc6 \ No newline at end of file diff --git a/docs/multimodal.html b/docs/multimodal.html index eda17b8dd..67051594b 100644 --- a/docs/multimodal.html +++ b/docs/multimodal.html @@ -511,6 +511,7 @@ gtag('config', 'G-9KYCVJBNMQ', { 'anonymize_ip': true});
base_model: mistralai/Mistral-Small-3.1-24B-Instruct-2503
-
-chat_template: mistral_v7_tekkenPlease make sure to install vision lib via pip install 'mistral-common[opencv]==1.8.5'
base_model: mistralai/Mistral-Small-3.1-24B-Instruct-2503Please make sure to install vision lib via pip install 'mistral-common[opencv]==1.8.5'
base_model: mistralai/Magistral-Small-2509Please make sure to install audio lib via pip3 install librosa==0.11.0 'mistral_common[audio]==1.8.3'
base_model: mistralai/Voxtral-Mini-3B-2507base_model: mistralai/Voxtral-Mini-3B-2507For multi-modal 4B/12B/27B models, use the following config:
-base_model: google/gemma-3-4b-it
-
-chat_template: gemma3base_model: google/gemma-3-4b-it
+
+chat_template: gemma3Please make sure to install timm via pip3 install timm==1.0.17
base_model: google/gemma-3n-E2B-it
-
-chat_template: gemma3nbase_model: google/gemma-3n-E2B-it
+
+chat_template: gemma3nbase_model: Qwen/Qwen2-VL-7B-Instruct
-
-chat_template: qwen2_vlbase_model: Qwen/Qwen2-VL-7B-Instruct
+
+chat_template: qwen2_vlbase_model: Qwen/Qwen2.5-VL-7B-Instruct
-
-chat_template: qwen2_vl # same as qwen2-vlbase_model: Qwen/Qwen2.5-VL-7B-Instruct
+
+chat_template: qwen2_vl # same as qwen2-vlPlease make sure to install num2words via pip3 install num2words==0.5.14
base_model: HuggingFaceTB/SmolVLM2-500M-Video-Instructbase_model: HuggingFaceTB/SmolVLM2-500M-Video-InstructPlease uninstall causal-conv1d via pip3 uninstall -y causal-conv1d
base_model: LiquidAI/LFM2-VL-450Mbase_model: LiquidAI/LFM2-VL-450MHere is an example of a multi-modal dataset:
-[
- {
- "messages": [
- {
- "role": "system",
- "content": [
- {"type": "text", "text": "You are a helpful assistant."}
- ]
- },
- {
- "role": "user",
- "content": [
- {"type": "image", "url": "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/bee.jpg"},
- {"type": "text", "text": "Describe this image in detail."}
- ]
- },
- {
- "role": "assistant",
- "content": [
- {"type": "text", "text": "The image is a bee."}
- ]
- }
- ]
- }
-][
+ {
+ "messages": [
+ {
+ "role": "system",
+ "content": [
+ {"type": "text", "text": "You are a helpful assistant."}
+ ]
+ },
+ {
+ "role": "user",
+ "content": [
+ {"type": "image", "url": "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/bee.jpg"},
+ {"type": "text", "text": "Describe this image in detail."}
+ ]
+ },
+ {
+ "role": "assistant",
+ "content": [
+ {"type": "text", "text": "The image is a bee."}
+ ]
+ }
+ ]
+ }
+]