From 5bb1f3da5605548eac9e4bf338a351e29b2ea02c Mon Sep 17 00:00:00 2001
From: NanoCode012
Date: Wed, 30 Apr 2025 14:32:23 +0700
Subject: [PATCH] feat: add qwen3 moe block for ds3 (#2596) [skip ci]

---
 src/axolotl/common/architectures.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/axolotl/common/architectures.py b/src/axolotl/common/architectures.py
index 827a63c07..2f77b613e 100644
--- a/src/axolotl/common/architectures.py
+++ b/src/axolotl/common/architectures.py
@@ -11,5 +11,6 @@ MOE_ARCH_BLOCK = {
     ],
     "mixtral": "MixtralSparseMoeBlock",
     "qwen2_moe": "Qwen2MoeSparseMoeBlock",
+    "qwen3_moe": "Qwen3MoeSparseMoeBlock",
     "deepseek_v2": "DeepseekV2MoE",
 }