Skip to content

Commit d27949f

Browse files
committed
Revert "try remove volta as a dedicated target b (+1 squashed commits)"
This reverts commit ddba580.
1 parent ddba580 commit d27949f

File tree

2 files changed: +4 −2 lines changed

2 files changed: +4 −2 lines changed

CMakeLists.txt

Lines changed: 2 additions & 2 deletions
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | @@ -139,10 +139,10 @@ if (LLAMA_CUBLAS) |
| 139 | 139 | elseif(CUDAToolkit_VERSION VERSION_GREATER 12) |
| 140 | 140 | add_compile_definitions(GGML_CUDA_USE_GRAPHS) #try enable cuda graphs on cu12 build |
| 141 | 141 | add_compile_definitions(KCPP_LIMIT_CUDA_MAX_ARCH=800) |
| 142 | | - set(CMAKE_CUDA_ARCHITECTURES "50-virtual;61-virtual;75-virtual;80-virtual") # lowest CUDA 12 standard + lowest for integer intrinsics |
| | 142 | + set(CMAKE_CUDA_ARCHITECTURES "50-virtual;61-virtual;70-virtual;75-virtual;80-virtual") # lowest CUDA 12 standard + lowest for integer intrinsics |
| 143 | 143 | else() |
| 144 | 144 | add_compile_definitions(KCPP_LIMIT_CUDA_MAX_ARCH=750) #will cause issues with ggml_cuda_highest_compiled_arch if removed |
| 145 | | - set(CMAKE_CUDA_ARCHITECTURES "35-virtual;50-virtual;61-virtual;75-virtual") # lowest CUDA 12 standard + lowest for integer intrinsics |
| | 145 | + set(CMAKE_CUDA_ARCHITECTURES "35-virtual;50-virtual;61-virtual;70-virtual;75-virtual") # lowest CUDA 12 standard + lowest for integer intrinsics |
| 146 | 146 | endif() |
| 147 | 147 | endif() |
| 148 | 148 | message(STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES}") |

Makefile

Lines changed: 2 additions & 0 deletions
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| | | @@ -226,13 +226,15 @@ NVCCFLAGS += -Wno-deprecated-gpu-targets \ |
| 226 | 226 | -gencode arch=compute_35,code=compute_35 \ |
| 227 | 227 | -gencode arch=compute_50,code=compute_50 \ |
| 228 | 228 | -gencode arch=compute_61,code=compute_61 \ |
| | 229 | + -gencode arch=compute_70,code=compute_70 \ |
| 229 | 230 | -gencode arch=compute_75,code=compute_75 \ |
| 230 | 231 | -DKCPP_LIMIT_CUDA_MAX_ARCH=750 |
| 231 | 232 | |
| 232 | 233 | else ifdef LLAMA_ARCHES_CU12 |
| 233 | 234 | NVCCFLAGS += -Wno-deprecated-gpu-targets \ |
| 234 | 235 | -gencode arch=compute_50,code=compute_50 \ |
| 235 | 236 | -gencode arch=compute_61,code=compute_61 \ |
| | 237 | + -gencode arch=compute_70,code=compute_70 \ |
| 236 | 238 | -gencode arch=compute_75,code=compute_75 \ |
| 237 | 239 | -gencode arch=compute_80,code=compute_80 \ |
| 238 | 240 | -DKCPP_LIMIT_CUDA_MAX_ARCH=800 |

0 commit comments

Comments
 (0)