Skip to content

Commit 6456fb4

Browse files
authored
Merge pull request #162 from RomeoV/master
Let torch determine correct cuda architecture
2 parents 5f4f9c5 + 37f758b commit 6456fb4

File tree

4 files changed: 4 additions (+4) and 3 deletions (-3).

4 files changed: 4 additions (+4) and 3 deletions (-3).

.github/workflows/building.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -70,7 +70,7 @@ jobs:
7070
if: ${{ matrix.cuda-version != 'cpu' }}
7171
run: |
7272
source .github/workflows/cuda/${{ matrix.cuda-version }}-${{ runner.os }}-env.sh
73-
FORCE_CUDA=1 WITH_METIS=1 pip install -e .
73+
FORCE_CUDA=1 WITH_METIS=1 TORCH_CUDA_ARCH_LIST="5.2 6.0 6.1 7.0 7.5 8.0 8.6+PTX" pip install -e .
7474
shell:
7575
bash
7676

CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@ if(WITH_CUDA)
99
enable_language(CUDA)
1010
add_definitions(-D__CUDA_NO_HALF_OPERATORS__)
1111
add_definitions(-DWITH_CUDA)
12-
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -arch=sm_35 --expt-relaxed-constexpr")
12+
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --expt-relaxed-constexpr")
1313
endif()
1414

1515
find_package(Python3 COMPONENTS Development)

conda/pytorch-sparse/meta.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -27,6 +27,7 @@ build:
2727
script_env:
2828
- FORCE_CUDA
2929
- WITH_METIS=1
30+
- TORCH_CUDA_ARCH_LIST="5.2 6.0 6.1 7.0 7.5 8.0 8.6+PTX"
3031
preserve_egg_dir: True
3132

3233
test:

setup.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,7 @@ def get_extensions():
6262
define_macros += [('WITH_CUDA', None)]
6363
nvcc_flags = os.getenv('NVCC_FLAGS', '')
6464
nvcc_flags = [] if nvcc_flags == '' else nvcc_flags.split(' ')
65-
nvcc_flags += ['-arch=sm_35', '--expt-relaxed-constexpr', '-O2']
65+
nvcc_flags += ['--expt-relaxed-constexpr', '-O2']
6666
extra_compile_args['nvcc'] = nvcc_flags
6767

6868
if sys.platform == 'win32':

0 commit comments

Comments
 (0)