We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3ad438c commit 51c31bcCopy full SHA for 51c31bc
cmake/utils.cmake
@@ -240,9 +240,12 @@ macro(override_gpu_arches GPU_ARCHES GPU_LANG GPU_SUPPORTED_ARCHES)
240
endif()
241
242
if (_SM)
243
- set(_VIRT "")
+ # The -real suffix makes CMake generate only ELF code for the kernels.
244
+ # We want this; otherwise the PTX that is added by default would increase the binary size.
245
+ set(_VIRT "-real")
246
set(_CODE_ARCH ${_SM})
247
else()
248
+ # The -virtual suffix makes CMake generate PTX code for the kernels.
249
set(_VIRT "-virtual")
250
set(_CODE_ARCH ${_CODE})
251
0 commit comments