From c3b61f1543b918e493fbfbe37c7decf17638f429 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Mon, 20 Oct 2025 14:17:45 -0400 Subject: [PATCH 1/3] add torch 2.9.0 to ci --- .github/workflows/tests.yml | 30 ++++++++++++++++++------------ 1 file changed, 18 insertions(+), 12 deletions(-) diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 8f368b5170..6fa0291769 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -55,7 +55,7 @@ jobs: fail-fast: false matrix: python_version: ["3.11"] - pytorch_version: ["2.7.1", "2.8.0"] + pytorch_version: ["2.7.1", "2.8.0", "2.9.0"] timeout-minutes: 20 steps: @@ -130,7 +130,7 @@ jobs: fail-fast: false matrix: python_version: ["3.11"] - pytorch_version: ["2.7.1", "2.8.0"] + pytorch_version: ["2.7.1", "2.8.0", "2.9.0"] timeout-minutes: 20 steps: @@ -231,19 +231,25 @@ jobs: fail-fast: false matrix: include: - - cuda: 126 - cuda_version: 12.6.3 - python_version: "3.11" - pytorch: 2.7.1 - num_gpus: 1 - axolotl_extras: - - cuda: 126 - cuda_version: 12.6.3 + - cuda: 128 + cuda_version: 12.8.1 python_version: "3.11" - pytorch: 2.7.1 + pytorch: 2.9.0 num_gpus: 1 axolotl_extras: - dockerfile: "Dockerfile-uv.jinja" +# - cuda: 126 +# cuda_version: 12.6.3 +# python_version: "3.11" +# pytorch: 2.7.1 +# num_gpus: 1 +# axolotl_extras: +# - cuda: 126 +# cuda_version: 12.6.3 +# python_version: "3.11" +# pytorch: 2.7.1 +# num_gpus: 1 +# axolotl_extras: +# dockerfile: "Dockerfile-uv.jinja" steps: - name: Checkout uses: actions/checkout@v4 From 569b674e1e0896d9527a4665d39bffbf7258b233 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Mon, 20 Oct 2025 20:03:36 -0400 Subject: [PATCH 2/3] handle xformers for 2.9.0 --- setup.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/setup.py b/setup.py index 9e3de48b53..6f96db83fb 100644 --- a/setup.py +++ b/setup.py @@ -62,7 +62,9 @@ def parse_requirements(extras_require_map): else: raise ValueError("Invalid version format") - if (major, minor) >= (2, 8): + if (major, minor) >= (2, 9): + _install_requires.pop(_install_requires.index(xformers_version)) + elif (major, minor) >= (2, 8): pass elif (major, minor) >= (2, 7): _install_requires.pop(_install_requires.index(xformers_version)) From 5b8bd868a61c74aca22378700dab18e6669a7094 Mon Sep 17 00:00:00 2001 From: Wing Lian Date: Thu, 23 Oct 2025 10:19:45 -0700 Subject: [PATCH 3/3] enable 2.9.0 in multigpu and prioritize 2.8.0 over 2.7.1 --- .github/workflows/multi-gpu-e2e.yml | 7 +++++++ .github/workflows/tests.yml | 32 ++++++++++++++--------------- 2 files changed, 23 insertions(+), 16 deletions(-) diff --git a/.github/workflows/multi-gpu-e2e.yml b/.github/workflows/multi-gpu-e2e.yml index 6a92de352c..1682beb31a 100644 --- a/.github/workflows/multi-gpu-e2e.yml +++ b/.github/workflows/multi-gpu-e2e.yml @@ -40,6 +40,13 @@ jobs: axolotl_extras: fbgemm-gpu num_gpus: 2 nightly_build: "true" + - cuda: 128 + cuda_version: 12.8.1 + python_version: "3.11" + pytorch: 2.9.0 + axolotl_extras: fbgemm-gpu + num_gpus: 2 + nightly_build: "true" runs-on: [self-hosted, modal] timeout-minutes: 120 steps: diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 6fa0291769..e26825757a 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -234,22 +234,10 @@ jobs: - cuda: 128 cuda_version: 12.8.1 python_version: "3.11" - pytorch: 2.9.0 + pytorch: 2.8.0 num_gpus: 1 axolotl_extras: -# - cuda: 126 -# cuda_version: 12.6.3 -# python_version: "3.11" -# pytorch: 2.7.1 -# num_gpus: 1 -# axolotl_extras: -# - cuda: 126 -# cuda_version: 12.6.3 -# python_version: "3.11" -# pytorch: 2.7.1 -# num_gpus: 1 -# axolotl_extras: -# dockerfile: "Dockerfile-uv.jinja" + dockerfile: "Dockerfile-uv.jinja" steps: - name: Checkout uses: actions/checkout@v4 @@ -292,12 +280,18 @@ jobs: fail-fast: false matrix: include: - - cuda: 128 - cuda_version: 12.8.1 + - cuda: 126 + cuda_version: 12.6.3 python_version: "3.11" pytorch: 2.7.1 num_gpus: 1 axolotl_extras: +# - cuda: 128 +# cuda_version: 12.8.1 +# python_version: "3.11" +# pytorch: 2.7.1 +# num_gpus: 1 +# axolotl_extras: - cuda: 128 cuda_version: 12.8.1 python_version: "3.11" @@ -305,6 +299,12 @@ jobs: num_gpus: 1 gpu_type: "B200" axolotl_extras: fbgemm-gpu + - cuda: 128 + cuda_version: 12.8.1 + python_version: "3.11" + pytorch: 2.9.0 + num_gpus: 1 + axolotl_extras: steps: - name: Checkout uses: actions/checkout@v4