fix: qwen3_vl attention config (#3216)
This commit is contained in:
@@ -134,6 +134,11 @@ def get_attention_cls_from_config(cfg: DictDefault) -> Type[nn.Module]:
|
|||||||
|
|
||||||
return Qwen2Attention
|
return Qwen2Attention
|
||||||
|
|
||||||
|
if model_type == "qwen3_vl":
|
||||||
|
from transformers.models.qwen3_vl.modeling_qwen3_vl import Qwen3VLTextAttention
|
||||||
|
|
||||||
|
return Qwen3VLTextAttention
|
||||||
|
|
||||||
if model_type == "mllama":
|
if model_type == "mllama":
|
||||||
from transformers.models.mllama.modeling_mllama import MllamaTextSelfAttention
|
from transformers.models.mllama.modeling_mllama import MllamaTextSelfAttention
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user