Correct name of MixtralBlockSparseTop2MLP (L -> l) (#1667)

This commit is contained in:
Seungduk Kim
2024-05-29 07:10:29 +09:00
committed by GitHub
parent 6a5a725f10
commit 65db903714

View File

@@ -42,9 +42,9 @@ def patch_mixtral_moe_forward_zero3() -> None:
 return final_hidden_states, router_logits
 from transformers.models.mixtral.modeling_mixtral import (
-MixtralBLockSparseTop2MLP,
+MixtralBlockSparseTop2MLP,
 MixtralSparseMoeBlock,
 )
-MixtralBLockSparseTop2MLP.forward = mlp_forward
+MixtralBlockSparseTop2MLP.forward = mlp_forward
 MixtralSparseMoeBlock.forward = moe_forward