File tree Expand file tree Collapse file tree 1 file changed +8
-6
lines changed Expand file tree Collapse file tree 1 file changed +8
-6
lines changed Original file line number Diff line number Diff line change @@ -177,7 +177,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
177177 include (FetchContent)
178178 set (CUTLASS_ENABLE_HEADERS_ONLY ON CACHE BOOL "Enable only the header library")  # was "VAR=ON" as a single token, which names a bogus variable and sets nothing; cached so the fetched project's own cache declaration keeps this value
179179 FetchContent_Declare(
180- cutlass
180+ cutlass
181181 GIT_REPOSITORY https://github.com/nvidia/cutlass.git
182182 # CUTLASS 3.5.0
183183 GIT_TAG 7d49e6c7e2f8896c47f586706e67e1fb215529dc
@@ -200,11 +200,13 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
200200 # The CUTLASS kernels for Hopper require sm90a to be enabled.
201201 # This is done via the below gencode option, BUT that creates kernels for both sm90 and sm90a.
202202 # That adds an extra 17MB to the compiled binary, so instead we enable it only for the source file that needs it.
203- set_source_files_properties (
204- "csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
205- PROPERTIES
206- COMPILE_FLAGS
207- "-gencode arch=compute_90a,code=sm_90a" )
203+ if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 12.0)  # sm_90a is only accepted by nvcc 12.0+; "VERSION_GREATER 11" also matched 11.x (e.g. 11.8)
204+ set_source_files_properties (
205+ "csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
206+ PROPERTIES
207+ COMPILE_FLAGS
208+ "-gencode arch=compute_90a,code=sm_90a" )
209+ endif ()
208210
209211endif ()
210212
You can’t perform that action at this time.
0 commit comments