diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 7ff712757..29cd2556d 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -20,12 +20,11 @@ jobs: python_version: "3.11" pytorch: 2.5.1 axolotl_extras: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 axolotl_extras: vllm - is_latest: true - cuda: 126 cuda_version: 12.6.3 python_version: "3.11" @@ -88,8 +87,8 @@ jobs: python_version: "3.11" pytorch: 2.5.1 axolotl_extras: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 axolotl_extras: @@ -146,8 +145,8 @@ jobs: strategy: matrix: include: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 axolotl_extras: diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index deea0ed29..09d9663a9 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -26,11 +26,11 @@ jobs: fail-fast: false matrix: include: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 - axolotl_extras: vllm + axolotl_extras: num_gpus: 2 nightly_build: "true" - cuda: 124 diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index bb865e98d..b489e27b8 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -195,12 +195,12 @@ jobs: fail-fast: false matrix: include: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 num_gpus: 1 - axolotl_extras: vllm + axolotl_extras: - cuda: 126 cuda_version: 12.6.3 python_version: "3.11" @@ -247,8 +247,8 @@ jobs: fail-fast: false matrix: include: - - cuda: 124 - cuda_version: 12.4.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.6.0 num_gpus: 1 @@ -311,7 +311,7 @@ jobs: python_version: "3.11" pytorch: 2.6.0 num_gpus: 1 - axolotl_extras: vllm + axolotl_extras: steps: - name: Checkout uses: actions/checkout@v4 diff --git a/docker/Dockerfile-base b/docker/Dockerfile-base index cc9ca2f2d..52201f276 100644 --- a/docker/Dockerfile-base +++ b/docker/Dockerfile-base @@ -37,7 +37,3 @@ RUN git lfs install --skip-repo && \ pip3 install awscli && \ # The base image ships with `pydantic==1.8.2` which is not working pip3 install -U --no-cache-dir pydantic==1.10.10 - -RUN if [ "$PYTORCH_VERSION" = "2.7.1" ] ; then \ - pip3 install flash-attn==2.7.4.post1; \ - fi diff --git a/docker/Dockerfile-uv-base b/docker/Dockerfile-uv-base index c612278ae..4b08e55f8 100644 --- a/docker/Dockerfile-uv-base +++ b/docker/Dockerfile-uv-base @@ -34,7 +34,3 @@ RUN uv pip install packaging setuptools wheel psutil \ && uv pip install --no-build-isolation "causal_conv1d @ git+https://github.com/Dao-AILab/causal-conv1d.git@main" \ && uv pip install "mamba_ssm @ git+https://github.com/state-spaces/mamba.git@main" \ && uv pip install awscli pydantic - -RUN if [ "$PYTORCH_VERSION" = "2.7.1" ] ; then \ - uv pip install --no-build-isolation flash-attn==2.7.4.post1; \ - fi diff --git a/setup.py b/setup.py index 08c39c71c..212625bdd 100644 --- a/setup.py +++ b/setup.py @@ -111,9 +111,9 @@ def get_package_version(): extras_require = { - "flash-attn": ["flash-attn==2.7.4.post1"], + "flash-attn": ["flash-attn==2.8.0.post2"], "ring-flash-attn": [ - "flash-attn==2.7.4.post1", + "flash-attn==2.8.0.post2", "ring-flash-attn>=0.1.4", "yunchang==0.6.0", ],