Add multipack support for deepseek_v2 (#1712)

This commit is contained in:
Wing Lian
2024-06-20 10:02:55 -04:00
committed by GitHub
parent 3f1f5e3312
commit 4de4b4089f

View File

@@ -18,6 +18,7 @@ SUPPORTED_MULTIPACK_MODEL_TYPES = [
"gemma",
"gemmoe",
"starcoder2",
"deepseek_v2",
]
@@ -56,6 +57,8 @@ def patch_for_multipack(model_type, model_name=None):
patch_remote(model_name, ".configuration_gemmoe", ".modeling_gemmoe")
elif model_type == "jamba":
patch_remote(model_name, ".configuration_jamba", ".modeling_jamba")
elif model_type == "deepseek_v2":
patch_remote(model_name, ".configuration_deepseek", ".modeling_deepseek")
def patch_remote(model_name, config_name, modeling_name):