
Commit c1ac8d0

[CI] Upgrade CI envs to torch~=2.7.0 (#450)
1 parent fd0d54b · commit c1ac8d0

File tree: 7 files changed (+144, -24 lines)
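For context on the version pin itself: `torch~=2.7.0` uses the PEP 440 "compatible release" operator, which allows any 2.7.x patch release but not 2.8. A minimal illustration (not part of this commit):

```sh
# "~=" is a compatible-release constraint
pip install "torch~=2.7.0"   # equivalent to: pip install "torch>=2.7.0,<2.8"
```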

.github/workflows/intel-a770.yml

Lines changed: 4 additions & 7 deletions
@@ -62,10 +62,11 @@ jobs:
       - name: Setup python
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
         run: |
+          pip install -U uv
           pip uninstall -y flash-linear-attention
-          pip install -U pytest setuptools wheel ninja
-          pip install -U torch pytorch-triton-xpu --index-url https://download.pytorch.org/whl/xpu
-          pip install --no-use-pep517 .
+          uv pip install -U pytest setuptools wheel ninja
+          uv pip install -U torch~=2.7.0 pytorch-triton-xpu --index-url https://download.pytorch.org/whl/xpu
+          pip install .

       - name: Check GPU status
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
@@ -83,15 +84,13 @@ jobs:
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on test files
-        continue-on-error: true
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on varlen test files
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
-        continue-on-error: true
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }} || \
@@ -105,14 +104,12 @@ jobs:

       # skip full pytest because it takes too long
       - name: Run full pytest on test files
-        continue-on-error: true
         if: false && github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run full pytest on varlen test files
-        continue-on-error: true
         if: false && github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
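The workflows now bootstrap [uv](https://github.com/astral-sh/uv), Astral's pip-compatible installer, and route most installs through it, while the final `pip install .` of the repo itself stays unchanged. A rough sketch of the pattern, assuming an already activated virtual environment (uv's `pip` interface targets the active environment by default):

```sh
pip install -U uv                                  # bootstrap uv once with regular pip
uv pip install -U pytest setuptools wheel ninja    # then let uv resolve and install the rest
```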

.github/workflows/nvidia-4090.yml

Lines changed: 6 additions & 5 deletions
@@ -67,7 +67,12 @@ jobs:
           # pip install -U pytest setuptools wheel ninja torch triton
           # MAX_JOBS=4 pip install -U flash-attn --no-build-isolation
           # pip install git+https://github.com/Dao-AILab/causal-conv1d.git --no-build-isolation
-          pip install --no-use-pep517 .
+          pip install -U uv
+          pip uninstall -y flash-linear-attention
+          uv pip install git+https://github.com/Dao-AILab/causal-conv1d.git -U --no-cache-dir --no-build-isolation
+          uv pip install flash-attn -U --no-cache-dir --no-build-isolation
+          uv pip install torch~=2.7.0 triton pytest setuptools wheel ninja -U --index-url https://download.pytorch.org/whl/cu128
+          pip install .

       - name: Check GPU status
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
@@ -85,15 +90,13 @@ jobs:
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on test files
-        continue-on-error: true
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on varlen test files
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
-        continue-on-error: true
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }} || \
@@ -106,14 +109,12 @@ jobs:
           pytest tests/

       - name: Run full pytest on test files
-        continue-on-error: true
         if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run full pytest on varlen test files
-        continue-on-error: true
         if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
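Taken together, the added lines are the CUDA 12.8 install sequence shared by the NVIDIA runners (the a100 and h100 workflows below add the same block). As a local sketch it relies on one assumption: a working torch is already present, which is why `flash-attn` and `causal-conv1d` can build with `--no-build-isolation` before the torch~=2.7.0 upgrade; on a clean machine you would likely install torch first.

```sh
pip install -U uv
pip uninstall -y flash-linear-attention
uv pip install git+https://github.com/Dao-AILab/causal-conv1d.git -U --no-cache-dir --no-build-isolation
uv pip install flash-attn -U --no-cache-dir --no-build-isolation
uv pip install torch~=2.7.0 triton pytest setuptools wheel ninja -U --index-url https://download.pytorch.org/whl/cu128
pip install .
```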

.github/workflows/nvidia-a100.yml

Lines changed: 121 additions & 0 deletions
@@ -0,0 +1,121 @@
+name: nvidia-a100-ci
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
+  cancel-in-progress: ${{ github.event_name == 'pull_request' }}
+
+on:
+  pull_request:
+    branches: [ '*' ]
+    types: [opened, synchronize, reopened, closed]
+  push:
+    branches:
+      - main
+    tags:
+      - '*'
+
+jobs:
+  test:
+    if: github.event_name != 'pull_request' || github.event.action != 'closed'
+    runs-on: 'nvidia-a100'
+    env:
+      FLA_CI_ENV: 1
+    steps:
+      - name: Check out repo
+        uses: actions/checkout@v4
+
+      - name: Check skip keyword in LATEST commit (Push only)
+        id: check_skip
+        run: |
+          if [ "${{ github.event_name }}" = "push" ] && ! [[ "${{ github.ref }}" =~ ^refs/tags/ ]]; then
+            COMMIT_MSG=$(jq -r '.head_commit.message' <<< '${{ toJSON(github.event) }}')
+            echo "Latest commit message: $COMMIT_MSG"
+            if echo "$COMMIT_MSG" | grep -qF "[skip test]"; then
+              echo "::notice::Tests skipped by commit message"
+              echo "skip_tests=true" >> $GITHUB_OUTPUT
+            else
+              echo "skip_tests=false" >> $GITHUB_OUTPUT
+            fi
+          else
+            echo "skip_tests=false" >> $GITHUB_OUTPUT
+          fi
+
+      - name: Get changed files
+        if: |
+          (github.event_name == 'pull_request' ||
+          (github.event_name == 'push' && !startsWith(github.ref, 'refs/tags/'))) &&
+          (steps.check_skip.outputs.skip_tests != 'true' || github.event_name != 'push')
+        id: changed-files
+        uses: tj-actions/[email protected]
+
+      - name: Find dependent test files
+        if: |
+          (github.event_name == 'pull_request' ||
+          (github.event_name == 'push' && !startsWith(github.ref, 'refs/tags/'))) &&
+          (steps.check_skip.outputs.skip_tests != 'true' || github.event_name != 'push')
+        id: find-dependent-tests
+        run: |
+          # Run the Python script to find dependent test files
+          TEST_FILES=$(python scripts/find_dependent_tests.py "${{ steps.changed-files.outputs.all_changed_files }}")
+          echo "test_files=$TEST_FILES" >> $GITHUB_OUTPUT
+
+      - name: Setup python
+        if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          # Installed by hand to avoid issues with pip
+          # pip install -U pytest setuptools wheel ninja torch triton
+          # MAX_JOBS=4 pip install -U flash-attn --no-build-isolation
+          # pip install git+https://github.com/Dao-AILab/causal-conv1d.git --no-build-isolation
+          pip install -U uv
+          pip uninstall -y flash-linear-attention
+          uv pip install git+https://github.com/Dao-AILab/causal-conv1d.git -U --no-cache-dir --no-build-isolation
+          uv pip install flash-attn -U --no-cache-dir --no-build-isolation
+          uv pip install torch~=2.7.0 triton pytest setuptools wheel ninja -U --index-url https://download.pytorch.org/whl/cu128
+          pip install .
+
+      - name: Check GPU status
+        if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          python scripts/check_gpu.py
+          if [ $? -ne 0 ]; then
+            echo "GPU is occupied. Stopping the workflow."
+            exit 1
+          fi
+
+      - name: Test compiling on changed test files
+        if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=1 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
+          pytest ${{ steps.find-dependent-tests.outputs.test_files }}
+
+      - name: Run pytest on test files
+        if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
+          pytest ${{ steps.find-dependent-tests.outputs.test_files }}
+
+      - name: Run pytest on varlen test files
+        if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
+          pytest ${{ steps.find-dependent-tests.outputs.test_files }} || \
+          echo "Varlen tests failed (non-critical)"
+
+      - name: Test full compiling on all test files
+        if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=1 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
+          pytest tests/
+
+      - name: Run full pytest on test files
+        if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
+          pytest ${{ steps.find-dependent-tests.outputs.test_files }}
+
+      - name: Run full pytest on varlen test files
+        if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
+        run: |
+          FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
+          pytest ${{ steps.find-dependent-tests.outputs.test_files }} || \
+          echo "Varlen tests failed (non-critical)"

.github/workflows/nvidia-h100.yml

Lines changed: 6 additions & 6 deletions
@@ -62,12 +62,16 @@ jobs:
       - name: Setup python
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
         run: |
-          pip uninstall -y flash-linear-attention
           # Installed by hand to avoid issues with pip
           # pip install -U pytest setuptools wheel ninja torch triton
           # MAX_JOBS=4 pip install -U flash-attn --no-build-isolation
           # pip install git+https://github.com/Dao-AILab/causal-conv1d.git --no-build-isolation
-          pip install --no-use-pep517 .
+          pip install -U uv
+          pip uninstall -y flash-linear-attention
+          uv pip install git+https://github.com/Dao-AILab/causal-conv1d.git -U --no-cache-dir --no-build-isolation
+          uv pip install flash-attn -U --no-cache-dir --no-build-isolation
+          uv pip install torch~=2.7.0 triton pytest setuptools wheel ninja -U --index-url https://download.pytorch.org/whl/cu128
+          pip install .

       - name: Check GPU status
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
@@ -85,15 +89,13 @@ jobs:
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on test files
-        continue-on-error: true
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run pytest on varlen test files
         if: steps.find-dependent-tests.outputs.test_files && steps.check_skip.outputs.skip_tests == 'false'
-        continue-on-error: true
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }} || \
@@ -106,14 +108,12 @@ jobs:
           pytest tests/

       - name: Run full pytest on test files
-        continue-on-error: true
         if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=1 \
           pytest ${{ steps.find-dependent-tests.outputs.test_files }}

       - name: Run full pytest on varlen test files
-        continue-on-error: true
         if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/') && steps.check_skip.outputs.skip_tests == 'false'
         run: |
           FLA_COMPILER_MODE=0 TRITON_PRINT_AUTOTUNING=0 SKIP_TEST_CHUNK_VARLEN=0 \

FAQs.md

Lines changed: 3 additions & 2 deletions
@@ -23,7 +23,7 @@ conda create -n triton-nightly python=3.12
 conda activate triton-nightly

 # Install PyTorch nightly (required for Triton nightly compatibility)
-pip install -U --pre torch --index-url https://download.pytorch.org/whl/nightly/cu126
+pip install -U --pre torch --index-url https://download.pytorch.org/whl/nightly/cu128

 # Install Triton nightly
 pip uninstall triton pytorch-triton -y
@@ -34,8 +34,9 @@ pip install einops ninja datasets transformers numpy
 pip uninstall flash-linear-attention && pip install -U --no-use-pep517 git+https://github.com/fla-org/flash-linear-attention --no-deps

 # Optional: Install flash-attention
-conda install nvidia/label/cuda-12.6.3::cuda-nvcc
+conda install nvidia/label/cuda-12.8.1::cuda-nvcc
 pip install packaging psutil ninja
+pip install git+https://github.com/Dao-AILab/causal-conv1d.git --no-build-isolation
 pip install flash-attn --no-deps --no-cache-dir --no-build-isolation

 # Optional: Verify flash-attention installation
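A quick, assumed check (not part of this diff) that the nightly torch build and Triton are the ones actually loaded:

```sh
# prints the torch version, its CUDA toolkit, and the triton version
python -c "import torch, triton; print(torch.__version__, torch.version.cuda, triton.__version__)"
```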

README.md

Lines changed: 3 additions & 3 deletions
@@ -76,7 +76,7 @@ Roughly sorted according to the timeline supported in `fla`. The recommended tra

 ## Installation

-[![nvidia-4090-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-4090.yml/badge.svg?branch=main&event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-4090.yml) [![nvidia-h100-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-h100.yml/badge.svg?branch=main&event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-h100.yml) [![intel-a770-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/intel-a770.yml/badge.svg?event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/intel-a770.yml)
+[![nvidia-4090-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-4090.yml/badge.svg?branch=main&event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-4090.yml) [![nvidia-a100-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-a100.yml/badge.svg?branch=main)](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-a100.yml) [![nvidia-h100-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-h100.yml/badge.svg?branch=main&event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/nvidia-h100.yml) [![intel-a770-ci](https://github.com/fla-org/flash-linear-attention/actions/workflows/intel-a770.yml/badge.svg?event=push)](https://github.com/fla-org/flash-linear-attention/actions/workflows/intel-a770.yml)

 The following requirements should be satisfied
 - [PyTorch](https://pytorch.org/) >= 2.5
@@ -88,12 +88,12 @@ The following requirements should be satisfied

 You can install `fla` with pip:
 ```sh
-pip install --no-use-pep517 flash-linear-attention
+pip install flash-linear-attention
 ```
 As `fla` is actively developed now, for the latest features and updates, an alternative way is to install the package from source
 ```sh
 # uninstall `fla` first to ensure a successful upgrade
-pip uninstall flash-linear-attention && pip install -U --no-use-pep517 git+https://github.com/fla-org/flash-linear-attention
+pip uninstall flash-linear-attention && pip install -U git+https://github.com/fla-org/flash-linear-attention
 ```
 or manage `fla` with submodules
 ```sh
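With the `--no-use-pep517` flag gone from both install paths, a plain `pip install` suffices; a hypothetical sanity check of the installed distribution (not part of the README) could be:

```sh
python -c "import importlib.metadata as m; print(m.version('flash-linear-attention'))"
```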

pyproject.toml

Lines changed: 1 addition & 1 deletion
@@ -31,7 +31,7 @@ dev = ["pytest"]
 Homepage = "https://github.com/fla-org/flash-linear-attention"

 [build-system]
-requires = ["setuptools>=45", "wheel", "ninja", "torch"]
+requires = ["setuptools>=45", "wheel"]

 [tool.isort]
 line_length = 127
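Dropping `ninja` and `torch` from `[build-system].requires` means building the wheel no longer needs torch in the build environment, which is presumably what makes the `--no-use-pep517` workaround above unnecessary. Under that assumption, a standard isolated PEP 517 build should work out of the box, e.g. with the `build` frontend:

```sh
pip install build
python -m build --wheel    # builds the wheel in an isolated PEP 517 build environment
```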
