From ae8ae7534c338b37beee92d36c7ba078ac6aacdb Mon Sep 17 00:00:00 2001
From: NanoCode012
Date: Wed, 30 Apr 2025 14:32:23 +0700
Subject: [PATCH] feat: add qwen3 moe block for ds3 (#2596) [skip ci]

---
 src/axolotl/common/architectures.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/src/axolotl/common/architectures.py b/src/axolotl/common/architectures.py
index 827a63c07..2f77b613e 100644
--- a/src/axolotl/common/architectures.py
+++ b/src/axolotl/common/architectures.py
@@ -11,5 +11,6 @@ MOE_ARCH_BLOCK = {
     ],
     "mixtral": "MixtralSparseMoeBlock",
     "qwen2_moe": "Qwen2MoeSparseMoeBlock",
+    "qwen3_moe": "Qwen3MoeSparseMoeBlock",
     "deepseek_v2": "DeepseekV2MoE",
 }