From 4de4b4089fbc43e04c696c10c1ac51eebf2c6a99 Mon Sep 17 00:00:00 2001
From: Wing Lian
Date: Thu, 20 Jun 2024 10:02:55 -0400
Subject: [PATCH] add support for multipack for deepseek_v2 (#1712)

---
 src/axolotl/monkeypatch/multipack.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/src/axolotl/monkeypatch/multipack.py b/src/axolotl/monkeypatch/multipack.py
index c1eb3127d..7f6296bb6 100644
--- a/src/axolotl/monkeypatch/multipack.py
+++ b/src/axolotl/monkeypatch/multipack.py
@@ -18,6 +18,7 @@ SUPPORTED_MULTIPACK_MODEL_TYPES = [
     "gemma",
     "gemmoe",
     "starcoder2",
+    "deepseek_v2",
 ]
 
 
@@ -56,6 +57,8 @@ def patch_for_multipack(model_type, model_name=None):
         patch_remote(model_name, ".configuration_gemmoe", ".modeling_gemmoe")
     elif model_type == "jamba":
         patch_remote(model_name, ".configuration_jamba", ".modeling_jamba")
+    elif model_type == "deepseek_v2":
+        patch_remote(model_name, ".configuration_deepseek", ".modeling_deepseek")
 
 
 def patch_remote(model_name, config_name, modeling_name):