Correct the class name MixtralBLockSparseTop2MLP -> MixtralBlockSparseTop2MLP (L -> l) (#1667)
This commit is contained in:
@@ -42,9 +42,9 @@ def patch_mixtral_moe_forward_zero3() -> None:
|
|||||||
return final_hidden_states, router_logits
|
return final_hidden_states, router_logits
|
||||||
|
|
||||||
from transformers.models.mixtral.modeling_mixtral import (
|
from transformers.models.mixtral.modeling_mixtral import (
|
||||||
MixtralBLockSparseTop2MLP,
|
MixtralBlockSparseTop2MLP,
|
||||||
MixtralSparseMoeBlock,
|
MixtralSparseMoeBlock,
|
||||||
)
|
)
|
||||||
|
|
||||||
MixtralBLockSparseTop2MLP.forward = mlp_forward
|
MixtralBlockSparseTop2MLP.forward = mlp_forward
|
||||||
MixtralSparseMoeBlock.forward = moe_forward
|
MixtralSparseMoeBlock.forward = moe_forward
|
||||||
|
|||||||
Reference in New Issue
Block a user