Add Python 3.10 to the base image build matrix; fix the CUDA arch-list arg in the DeepSpeed builder stage
This commit is contained in:
10
.github/workflows/base.yml
vendored
10
.github/workflows/base.yml
vendored
@@ -16,12 +16,19 @@ jobs:
|
|||||||
include:
|
include:
|
||||||
- cuda: "118"
|
- cuda: "118"
|
||||||
cuda_version: 11.8.0
|
cuda_version: 11.8.0
|
||||||
|
python_version: 3.9
|
||||||
|
axolotl_extras:
|
||||||
|
- cuda: "118"
|
||||||
|
cuda_version: 11.8.0
|
||||||
|
python_version: "3.10"
|
||||||
axolotl_extras:
|
axolotl_extras:
|
||||||
- cuda: "117"
|
- cuda: "117"
|
||||||
cuda_version: 11.7.0
|
cuda_version: 11.7.0
|
||||||
|
python_version: 3.9
|
||||||
pytorch: 1.13.1
|
pytorch: 1.13.1
|
||||||
axolotl_extras:
|
axolotl_extras:
|
||||||
- cuda: "118"
|
- cuda: "118"
|
||||||
|
python_version: 3.9
|
||||||
cuda_version: 11.8.0
|
cuda_version: 11.8.0
|
||||||
pytorch: 2.0.0
|
pytorch: 2.0.0
|
||||||
axolotl_extras: gptq
|
axolotl_extras: gptq
|
||||||
@@ -46,12 +53,13 @@ jobs:
|
|||||||
context: .
|
context: .
|
||||||
file: ./docker/Dockerfile-base
|
file: ./docker/Dockerfile-base
|
||||||
push: ${{ github.event_name != 'pull_request' }}
|
push: ${{ github.event_name != 'pull_request' }}
|
||||||
tags: ${{ steps.metadata.outputs.tags }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
||||||
labels: ${{ steps.metadata.outputs.labels }}
|
labels: ${{ steps.metadata.outputs.labels }}
|
||||||
cache-from: type=gha
|
cache-from: type=gha
|
||||||
cache-to: type=gha,mode=max
|
cache-to: type=gha,mode=max
|
||||||
build-args: |
|
build-args: |
|
||||||
CUDA_VERSION=${{ matrix.cuda_version }}
|
CUDA_VERSION=${{ matrix.cuda_version }}
|
||||||
CUDA=${{ matrix.cuda }}
|
CUDA=${{ matrix.cuda }}
|
||||||
|
PYTHON_VERSION=${{ matrix.python_version }}
|
||||||
PYTORCH_VERSION=${{ matrix.pytorch }}
|
PYTORCH_VERSION=${{ matrix.pytorch }}
|
||||||
AXOLOTL_EXTRAS=${{ matrix.axolotl_extras }}
|
AXOLOTL_EXTRAS=${{ matrix.axolotl_extras }}
|
||||||
|
|||||||
@@ -52,6 +52,8 @@ RUN git clone https://github.com/HazyResearch/flash-attention.git && \
|
|||||||
|
|
||||||
FROM base-builder AS deepspeed-builder
|
FROM base-builder AS deepspeed-builder
|
||||||
|
|
||||||
|
ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
|
||||||
|
|
||||||
WORKDIR /workspace
|
WORKDIR /workspace
|
||||||
|
|
||||||
RUN git clone https://github.com/microsoft/DeepSpeed.git && \
|
RUN git clone https://github.com/microsoft/DeepSpeed.git && \
|
||||||
|
|||||||
Reference in New Issue
Block a user