# Patch summary:
#   * .github/workflows/base.yml: add a python_version dimension to the build
#     matrix, include it in the image tag (-py<version>-) and pass it to the
#     Docker build as the PYTHON_VERSION build-arg.
#   * docker/Dockerfile-base: declare TORCH_CUDA_ARCH_LIST in the
#     deepspeed-builder stage.
#
# The python_version values are quoted on purpose: an unquoted 3.10 is a YAML
# float and is read as 3.1, which would yield a "-py3.1-" tag and
# PYTHON_VERSION=3.1.
#
# NOTE(review): leading whitespace inside the hunks was reconstructed from a
# whitespace-collapsed copy of this patch - confirm it against the target
# files before applying. The post-image blob ids on the "index" lines predate
# the quoting change and are informational only.
# NOTE(review): the new matrix entries show no `pytorch:` key in this hunk, and
# no `ARG PYTHON_VERSION` is visible in the Dockerfile hunk - confirm both are
# handled elsewhere.
diff --git a/.github/workflows/base.yml b/.github/workflows/base.yml
index 6078b2bae..61495e677 100644
--- a/.github/workflows/base.yml
+++ b/.github/workflows/base.yml
@@ -16,12 +16,19 @@ jobs:
         include:
           - cuda: "118"
             cuda_version: 11.8.0
+            python_version: "3.9"
+            axolotl_extras:
+          - cuda: "118"
+            cuda_version: 11.8.0
+            python_version: "3.10"
             axolotl_extras:
           - cuda: "117"
             cuda_version: 11.7.0
+            python_version: "3.9"
             pytorch: 1.13.1
             axolotl_extras:
           - cuda: "118"
+            python_version: "3.9"
             cuda_version: 11.8.0
             pytorch: 2.0.0
             axolotl_extras: gptq
@@ -46,12 +53,13 @@ jobs:
           context: .
           file: ./docker/Dockerfile-base
           push: ${{ github.event_name != 'pull_request' }}
-          tags: ${{ steps.metadata.outputs.tags }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
+          tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
           labels: ${{ steps.metadata.outputs.labels }}
           cache-from: type=gha
           cache-to: type=gha,mode=max
           build-args: |
             CUDA_VERSION=${{ matrix.cuda_version }}
             CUDA=${{ matrix.cuda }}
+            PYTHON_VERSION=${{ matrix.python_version }}
             PYTORCH_VERSION=${{ matrix.pytorch }}
             AXOLOTL_EXTRAS=${{ matrix.axolotl_extras }}
diff --git a/docker/Dockerfile-base b/docker/Dockerfile-base
index 710d1c1c2..2728f3a72 100644
--- a/docker/Dockerfile-base
+++ b/docker/Dockerfile-base
@@ -52,6 +52,8 @@ RUN git clone https://github.com/HazyResearch/flash-attention.git && \
 
 FROM base-builder AS deepspeed-builder
 
+ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
+
 WORKDIR /workspace
 
 RUN git clone https://github.com/microsoft/DeepSpeed.git && \