From a798ba16594a50940543542c8fb2d5d970bc20e8 Mon Sep 17 00:00:00 2001
From: Wing Lian
Date: Sun, 28 May 2023 12:28:37 -0400
Subject: [PATCH] ensure libbitsandbytes*.so gets included with wheel

---
Review note: the added COPY uses a wildcard source (libbitsandbytes*.so)
that can expand to more than one file, so its destination is written with
a trailing slash to mark it unambiguously as a directory. Only the added
line was adjusted; context lines are untouched so the hunk still applies.
The index line is carried over from the original patch, so its post-image
blob id no longer reflects the adjusted line.

 docker/Dockerfile-base | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/docker/Dockerfile-base b/docker/Dockerfile-base
index b775808bf..d32e2a3b5 100644
--- a/docker/Dockerfile-base
+++ b/docker/Dockerfile-base
@@ -76,9 +76,10 @@ RUN git clone https://github.com/NVIDIA/apex
 # `MAX_JOBS=1` disables parallel building to avoid cpu memory OOM when building image on GitHub Action (standard) runners
 RUN cd apex && MAX_JOBS=1 python3 -m pip install --global-option="--cpp_ext" --global-option="--cuda_ext" --no-cache -v --disable-pip-version-check .
 
-RUN mkdir /workspace/wheels
+RUN mkdir -p /workspace/wheels/bitsandbytes
 COPY --from=deepspeed-builder /workspace/DeepSpeed/dist/deepspeed-*.whl wheels
 COPY --from=bnb-builder /workspace/bitsandbytes/dist/bitsandbytes-*.whl wheels
+COPY --from=bnb-builder /workspace/bitsandbytes/bitsandbytes/libbitsandbytes*.so wheels/bitsandbytes/
 COPY --from=flash-attn-builder /workspace/flash-attention/dist/flash_attn-*.whl wheels
 COPY --from=flash-attn-builder /workspace/flash-attention/csrc/fused_dense_lib/dist/fused_dense_lib-*.whl wheels
 COPY --from=flash-attn-builder /workspace/flash-attention/csrc/xentropy/dist/xentropy_cuda_lib-*.whl wheels