From 0bbad9202cc7ce08883c951648dd85b6d4b96051 Mon Sep 17 00:00:00 2001 From: NanoCode012 Date: Thu, 7 Aug 2025 13:10:48 +0700 Subject: [PATCH] feat: add glm4moemoe to z3 --- src/axolotl/common/architectures.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/axolotl/common/architectures.py b/src/axolotl/common/architectures.py index ce945e670..616b4159b 100644 --- a/src/axolotl/common/architectures.py +++ b/src/axolotl/common/architectures.py @@ -13,5 +13,7 @@ MOE_ARCH_BLOCK = { "qwen2_moe": "Qwen2MoeSparseMoeBlock", "qwen3_moe": "Qwen3MoeSparseMoeBlock", "deepseek_v2": "DeepseekV2MoE", - "gpt_oss": "GptOssDecoderLayer", + "gpt_oss": "GptOssExperts", + "deepseek_v3": "DeepseekV3MoE", + "glm4_moe": "Glm4MoeMoE", }