Bump deepspeed to pick up the fix for grad-norm computation putting tensors on different devices (#1699)

This commit is contained in:
Wing Lian
2024-06-09 17:13:28 -04:00
committed by GitHub
parent 18cabc0c46
commit 851ccb1237
2 changed files with 2 additions and 2 deletions

View File

@@ -83,7 +83,7 @@ setup(
"fused-dense-lib @ git+https://github.com/Dao-AILab/flash-attention@v2.5.8#subdirectory=csrc/fused_dense_lib",
],
"deepspeed": [
-"deepspeed==0.14.2",
+"deepspeed @ git+https://github.com/microsoft/DeepSpeed.git@bc48371c5e1fb8fd70fc79285e66201dbb65679b",
"deepspeed-kernels",
],
"mamba-ssm": [