diff --git a/tests/e2e/multigpu/test_llama.py b/tests/e2e/multigpu/test_llama.py index 3bacac821..1ff795bd6 100644 --- a/tests/e2e/multigpu/test_llama.py +++ b/tests/e2e/multigpu/test_llama.py @@ -621,12 +621,6 @@ class TestMultiGPULlama: temp_dir + "/runs", "train/train_loss", 2.3, "Train Loss is too high" ) - # TODO: remove skip once deepspeed regression is fixed - # see https://github.com/huggingface/transformers/pull/37324 - @pytest.mark.skipif( - transformers_version_eq("4.51.0"), - reason="zero3 is not supported with transformers==4.51.0", - ) @pytest.mark.parametrize( "gradient_accumulation_steps", [1, 2],