Correct name of MixtralBlockSparseTop2MLP (L -> l) (#1667)

This commit is contained in:
Seungduk Kim
2024-05-29 07:10:29 +09:00
committed by GitHub
parent 6a5a725f10
commit 65db903714

View File

@@ -42,9 +42,9 @@ def patch_mixtral_moe_forward_zero3() -> None:
return final_hidden_states, router_logits
from transformers.models.mixtral.modeling_mixtral import (
-MixtralBLockSparseTop2MLP,
+MixtralBlockSparseTop2MLP,
MixtralSparseMoeBlock,
)
-MixtralBLockSparseTop2MLP.forward = mlp_forward
+MixtralBlockSparseTop2MLP.forward = mlp_forward
MixtralSparseMoeBlock.forward = moe_forward