@@ -16,22 +16,23 @@ jobs:
1616 matrix :
1717 runner : ${{ fromJson(inputs.matrix) }}
1818 include :
19- - image : rocm/pytorch:rocm6.2.2_ubuntu22.04_py3.10_pytorch_2.5.1_asan
19+ - image : rocm/pytorch:rocm7.0_ubuntu22.04_py3.10_pytorch_release_2.8.0
2020 runner : ["self-hosted", "gfx90a"]
2121 # Cache save/restore is on the host machine at directory /home/runner/.triton, while in the docker
2222 # container expect it at /github/home/.triton. So map here to make sure visible in docker.
2323 options : >-
2424 --device=/dev/kfd --device=/dev/dri --security-opt seccomp=unconfined --group-add video --user root
2525 --volume /home/runner/.triton:/github/home/.triton
26- - image : rocm/pytorch:rocm6.2.2_ubuntu22.04_py3.10_pytorch_2.5.1_asan
26+ - image : rocm/pytorch:rocm7.0_ubuntu22.04_py3.10_pytorch_release_2.8.0
2727 runner : ["amd-gfx942"]
2828 # We add --env-file to pull in HIP_VISIBLE_DEVICES and ROCR_VISIBLE_DEVICES definition for GPU isolation.
2929 options : >-
3030 --device=/dev/kfd --device=/dev/dri --security-opt seccomp=unconfined --group-add video --user root
3131 --env-file /etc/podinfo/gha-gpu-isolation-settings
3232 --volume /home/runner/.triton:/github/home/.triton
33- - image : rocm/7.0-preview:rocm7.0_preview_ubuntu22.04_llama2_70b_training_mlperf_mi35X_prealpha
33+ - image : rocm/pytorch:rocm7.0_ubuntu22.04_py3.10_pytorch_release_2.8.0
3434 runner : ["amd-gfx950"]
35+ # We add --env-file to pull in HIP_VISIBLE_DEVICES and ROCR_VISIBLE_DEVICES definition for GPU isolation.
3536 options : >-
3637 --device=/dev/kfd --device=/dev/dri --security-opt seccomp=unconfined --group-add video --user root
3738 --env-file /etc/podinfo/gha-gpu-isolation-settings
@@ -81,14 +82,16 @@ jobs:
8182 ~/.triton/nvidia
8283 ~/.triton/json
8384 key : ${{ runner.os }}-${{ runner.arch }}-llvm-${{ steps.cache-key.outputs.llvm }}-nvidia-${{ steps.cache-key.outputs.nvidia }}-json-${{ steps.cache-key.outputs.json }}
85+ - name : Install dependencies
86+ run : apt-get install -y clang lld ccache
8487 - name : Inspect cache directories
8588 run : |
8689 mkdir -p ~/.triton
8790 du -h -d 1 ~/.triton
8891
8992 mkdir -p ~/.ccache
9093 du -h -d 1 ~/.ccache
91- - name : Update compiler to clang
94+ - name : Update compiler to Clang
9295 run : |
9396 export CC=/usr/bin/clang
9497 export CXX=/usr/bin/clang++
@@ -98,19 +101,15 @@ jobs:
98101 echo "PATH is '$PATH'"
99102 pip uninstall -y triton pytorch-triton-rocm
100103
101- if [ "${{ matrix.runner[0] }}" != "amd-gfx950" ]; then
102- ccache --zero-stats
103- fi
104-
104+ ccache --zero-stats
105105 make dev-install
106- - name : CCache Stats
107- if : ${{ matrix.runner[0] != 'amd-gfx950' }}
106+ - name : Print ccache stats
108107 run : ccache --print-stats
109108 - name : Run lit tests
110109 run : make test-lit
111110 - name : Run C++ unittests
112111 run : make test-cpp
113- - name : Run python tests on AMD
112+ - name : Run Python tests on AMD
114113 run : |
115114 INSTRUMENTATION_LIB_DIR="${GITHUB_WORKSPACE}/python/triton/instrumentation"
116115 if [ ! -d "${INSTRUMENTATION_LIB_DIR}" ]; then
0 commit comments