Beta support for multipack with gemmoe (#1402)

This commit is contained in:
Wing Lian
2024-03-14 15:52:23 -04:00
committed by GitHub
parent 6366b0c212
commit 8df7b888ff
2 changed files with 18 additions and 2 deletions

View File

@@ -429,7 +429,7 @@ def load_model(
and cfg.flash_attention
and cfg.sample_packing
):
patch_for_multipack(cfg.model_config_type)
patch_for_multipack(cfg.model_config_type, model_name=cfg.base_model)
elif cfg.is_llama_derived_model:
# Modify all llama derived models in one block