Skip to content

Commit 90938c4

Browse files
committed
fix bug of cuda-11 compilation
1 parent fd66059 commit 90938c4

File tree

1 file changed

+23
-1
lines changed

1 file changed

+23
-1
lines changed

source/op/cuda/CMakeLists.txt

Lines changed: 23 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,17 @@ include_directories(cub)
1919

2020
message(STATUS "CUDA major version is " ${CUDA_VERSION_MAJOR})
2121

22-
if (${CUDA_VERSION_MAJOR} GREATER "10")
22+
if (${CUDA_VERSION_MAJOR} GREATER "11")
23+
# nvcc flags
24+
set(CUDA_NVCC_FLAGS -gencode arch=compute_60,code=sm_60; # Pascal – GP100/Tesla P100 – DGX-1 (Generic Pascal)
25+
-gencode arch=compute_61,code=sm_61; # Pascal - GTX 1080, GTX 1070, GTX 1060, GTX 1050, GTX 1030, Titan Xp, Tesla P40, Tesla P4, Discrete GPU on the NVIDIA Drive PX2
26+
-gencode arch=compute_70,code=sm_70; # Volta - GV100/Tesla V100, GTX 1180 (GV104)
27+
-gencode arch=compute_75,code=sm_75; # Turing - RTX 2080, Titan RTX, Quadro R8000
28+
-gencode arch=compute_80,code=sm_80; # Ampere - A100
29+
-gencode arch=compute_86,code=sm_86; # Ampere - RTX 3090
30+
-O3; -Xcompiler -fPIC;
31+
)
32+
elseif (${CUDA_VERSION_MAJOR} STREQUAL "11" AND ${CUDA_VERSION_MINOR} GREATER "0")
2333
# nvcc flags
2434
set(CUDA_NVCC_FLAGS -gencode arch=compute_50,code=sm_50;
2535
-gencode arch=compute_52,code=sm_52; # Tesla M40, Quadro M6000...
@@ -32,6 +42,18 @@ if (${CUDA_VERSION_MAJOR} GREATER "10")
3242
-gencode arch=compute_86,code=sm_86; # Ampere - RTX 3090
3343
-O3; -Xcompiler -fPIC;
3444
)
45+
elseif (${CUDA_VERSION_MAJOR} STREQUAL "11" AND ${CUDA_VERSION_MINOR} STREQUAL "0")
46+
# nvcc flags
47+
set(CUDA_NVCC_FLAGS -gencode arch=compute_50,code=sm_50;
48+
-gencode arch=compute_52,code=sm_52; # Tesla M40, Quadro M6000...
49+
-gencode arch=compute_53,code=sm_53;
50+
-gencode arch=compute_60,code=sm_60; # Pascal – GP100/Tesla P100 – DGX-1 (Generic Pascal)
51+
-gencode arch=compute_61,code=sm_61; # Pascal - GTX 1080, GTX 1070, GTX 1060, GTX 1050, GTX 1030, Titan Xp, Tesla P40, Tesla P4, Discrete GPU on the NVIDIA Drive PX2
52+
-gencode arch=compute_70,code=sm_70; # Volta - GV100/Tesla V100, GTX 1180 (GV104)
53+
-gencode arch=compute_75,code=sm_75; # Turing - RTX 2080, Titan RTX, Quadro R8000
54+
-gencode arch=compute_80,code=sm_80; # Ampere - A100
55+
-O3; -Xcompiler -fPIC;
56+
)
3557
elseif (${CUDA_VERSION_MAJOR} STREQUAL "10")
3658
set(CUDA_NVCC_FLAGS -gencode arch=compute_30,code=sm_30; # Tesla K10, Quadro K600 K420 K410,
3759
-gencode arch=compute_35,code=sm_35; # Tesla K20 K40, TITAN Z Black, GTX 780Ti 780

0 commit comments

Comments
 (0)