This repository was archived by the owner on Sep 4, 2025. It is now read-only.
File tree Expand file tree Collapse file tree 1 file changed +13
-2
lines changed Expand file tree Collapse file tree 1 file changed +13
-2
lines changed Original file line number Diff line number Diff line change @@ -195,9 +195,13 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
195
195
FetchContent_Declare(
196
196
cutlass
197
197
GIT_REPOSITORY https://github.com/nvidia/cutlass.git
198
- # CUTLASS 3.5.1
199
- GIT_TAG 06b21349bcf6ddf6a1686a47a137ad1446579db9
198
+ GIT_TAG v3.5.1
200
199
GIT_PROGRESS TRUE
200
+
201
+ # Speed up the CUTLASS download by fetching only the specified GIT_TAG instead of the full history.
202
+ # Important: If GIT_SHALLOW is enabled, GIT_TAG works only with branch names and tags.
203
+ # If the GIT_TAG above is ever changed to a commit hash, GIT_SHALLOW must be set to FALSE.
204
+ GIT_SHALLOW TRUE
201
205
)
202
206
FetchContent_MakeAvailable(cutlass)
203
207
@@ -231,6 +235,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
231
235
"-gencode arch=compute_90a,code=sm_90a" )
232
236
endif ()
233
237
238
+
234
239
#
235
240
# Machete kernels
236
241
@@ -289,6 +294,12 @@ define_gpu_extension_target(
289
294
USE_SABI 3
290
295
WITH_SOABI)
291
296
297
+ # When CUTLASS is compiled with NVCC >= 12.5, by default it uses
298
+ # cudaGetDriverEntryPointByVersion as a wrapper to avoid directly calling the
299
+ # driver API. This causes problems when linking with earlier versions of CUDA.
300
+ # Setting this compile definition sidesteps the issue by calling the driver directly.
301
+ target_compile_definitions (_C PRIVATE CUTLASS_ENABLE_DIRECT_CUDA_DRIVER_CALL=1)
302
+
292
303
#
293
304
# _moe_C extension
294
305
#
You can’t perform that action at this time.
0 commit comments