diff --git a/.github/workflows/more-tests.yml b/.github/workflows/more-tests.yml index dedbcc982..4100b2572 100644 --- a/.github/workflows/more-tests.yml +++ b/.github/workflows/more-tests.yml @@ -16,7 +16,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | set -xeou pipefail @@ -95,7 +95,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | set -xeou pipefail diff --git a/.github/workflows/periodic.yml b/.github/workflows/periodic.yml index 2e264e6cf..127ad5b50 100644 --- a/.github/workflows/periodic.yml +++ b/.github/workflows/periodic.yml @@ -122,7 +122,7 @@ jobs: secrets-env: "HF_TOKEN_PERIODIC" runner: ${{ matrix.runner }} gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" script: | echo "::group::Print machine info" nvidia-smi diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml index e44d9d037..b2277df51 100644 --- a/.github/workflows/pull.yml +++ b/.github/workflows/pull.yml @@ -227,7 +227,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" script: | echo "::group::Print machine info" nvidia-smi @@ -265,7 +265,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -314,7 +314,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" script: | echo "::group::Print machine info" nvidia-smi @@ -363,7 +363,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" script: | echo "::group::Print machine info" nvidia-smi @@ -413,7 +413,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" script: | echo "::group::Print machine info" nvidia-smi diff --git a/.github/workflows/run-readme-periodic.yml b/.github/workflows/run-readme-periodic.yml index 2c49a975f..51859c75e 100644 --- a/.github/workflows/run-readme-periodic.yml +++ b/.github/workflows/run-readme-periodic.yml @@ -19,7 +19,7 @@ jobs: runner: linux.g5.4xlarge.nvidia.gpu secrets-env: "HF_TOKEN_PERIODIC" gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -50,7 +50,7 @@ jobs: runner: linux.g5.4xlarge.nvidia.gpu secrets: inherit gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -81,7 +81,7 @@ jobs: runner: linux.g5.4xlarge.nvidia.gpu secrets-env: "HF_TOKEN_PERIODIC" gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" diff --git a/.github/workflows/run-readme-pr.yml b/.github/workflows/run-readme-pr.yml index fa786494c..49738d293 100644 --- a/.github/workflows/run-readme-pr.yml +++ b/.github/workflows/run-readme-pr.yml @@ -16,7 +16,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info and try install pip and/or pip3" @@ -39,7 +39,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info and try install pip and/or pip3" @@ -62,7 +62,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info and try install pip and/or pip3" @@ -86,7 +86,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info and try install pip and/or pip3" @@ -104,7 +104,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -127,7 +127,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -151,7 +151,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -175,7 +175,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -198,7 +198,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -220,7 +220,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -242,7 +242,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -264,7 +264,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -281,7 +281,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -309,7 +309,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" @@ -331,7 +331,7 @@ jobs: with: runner: linux.g5.4xlarge.nvidia.gpu gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" diff --git a/.github/workflows/runner-cuda-dtype.yml b/.github/workflows/runner-cuda-dtype.yml index 0b4597942..1d50f0064 100644 --- a/.github/workflows/runner-cuda-dtype.yml +++ b/.github/workflows/runner-cuda-dtype.yml @@ -17,7 +17,7 @@ jobs: runner: linux.g5.4xlarge.nvidia.gpu secrets-env: "HF_TOKEN_PERIODIC" gpu-arch-type: cuda - gpu-arch-version: "12.4" + gpu-arch-version: "12.6" timeout: 60 script: | echo "::group::Print machine info" diff --git a/install/install_requirements.sh b/install/install_requirements.sh index 0e58409c8..76e9fe94c 100755 --- a/install/install_requirements.sh +++ b/install/install_requirements.sh @@ -64,7 +64,7 @@ TUNE_NIGHTLY_VERSION=dev20250131 # with cuda for faster execution on cuda GPUs. if [[ -x "$(command -v nvidia-smi)" ]]; then - TORCH_NIGHTLY_URL="https://download.pytorch.org/whl/nightly/cu124" + TORCH_NIGHTLY_URL="https://download.pytorch.org/whl/nightly/cu126" elif [[ -x "$(command -v rocminfo)" ]]; then TORCH_NIGHTLY_URL="https://download.pytorch.org/whl/nightly/rocm6.2"