File tree Expand file tree Collapse file tree 2 files changed +7
-1
lines changed
Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Original file line number Diff line number Diff line change @@ -91,7 +91,7 @@ elseif(MSCCLPP_USE_CUDA)
9191 list (APPEND MSCCLPP_GPU_ARCHS 120)
9292 endif ()
9393elseif (MSCCLPP_USE_ROCM)
94- set (CMAKE_HIP_ARCHITECTURES gfx90a gfx941 gfx942)
94+ set (MSCCLPP_GPU_ARCHS gfx90a gfx941 gfx942)
9595endif ()
9696
9797message (STATUS "GPU architectures: ${MSCCLPP_GPU_ARCHS} " )
@@ -146,6 +146,9 @@ if(MSCCLPP_USE_CUDA)
146146 target_compile_definitions (mscclpp_obj PRIVATE MSCCLPP_USE_CUDA )
147147elseif (MSCCLPP_USE_ROCM)
148148 target_compile_definitions (mscclpp_obj PRIVATE MSCCLPP_USE_ROCM )
149+ foreach (arch ${MSCCLPP_GPU_ARCHS} )
150+ target_compile_options (mscclpp_obj PRIVATE --offload-arch=${arch} )
151+ endforeach ()
149152endif ()
150153if (MSCCLPP_ENABLE_TRACE)
151154 target_compile_definitions (mscclpp_obj PRIVATE MSCCLPP_ENABLE_TRACE )
Original file line number Diff line number Diff line change @@ -19,6 +19,9 @@ if(MSCCLPP_USE_CUDA)
1919 target_compile_definitions (mscclpp_nccl_obj PRIVATE MSCCLPP_USE_CUDA )
2020elseif (MSCCLPP_USE_ROCM)
2121 target_compile_definitions (mscclpp_nccl_obj PRIVATE MSCCLPP_USE_ROCM )
22+ foreach (arch ${MSCCLPP_GPU_ARCHS} )
23+ target_compile_options (mscclpp_nccl_obj PRIVATE --offload-arch=${arch} )
24+ endforeach ()
2225endif ()
2326if (MSCCLPP_NPKIT_FLAGS)
2427 target_compile_definitions (mscclpp_nccl_obj PRIVATE ${MSCCLPP_NPKIT_FLAGS} )
You can’t perform that action at this time.
0 commit comments