We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c3d9883 commit 2a7c3a8 (Copy full SHA for 2a7c3a8)
csrc/setup_cuda.py
@@ -226,6 +226,8 @@ def get_gencode_flags():
226
"gpu/fp8_gemm_with_cutlass/fp8_fp8_half_block_gemm.cu",
227
"gpu/fp8_gemm_with_cutlass/fp8_fp8_half_gemm_ptr_scale.cu",
228
]
229
+ sources += find_end_files("./gpu/mla_attn", ".cu")
230
+
231
sources += [
232
"gpu/sparse/sparse_compressor.cu",
233
"gpu/sparse/sparse_mm.cu",
0 commit comments