File tree Expand file tree Collapse file tree 2 files changed +4
-0
lines changed Expand file tree Collapse file tree 2 files changed +4
-0
lines changed Original file line number Diff line number Diff line change 57
57
gen_gemm_sm120_module ,
58
58
gen_gemm_sm120_module_cutlass_fp4 ,
59
59
gen_trtllm_gen_gemm_module ,
60
+ gen_trtllm_low_latency_gemm_module ,
60
61
)
61
62
from .jit .spdlog import gen_spdlog_module
62
63
from .jit .mla import gen_mla_module
@@ -460,6 +461,7 @@ def gen_all_modules(
460
461
)
461
462
jit_specs .append (gen_mxfp8_quantization_sm100_module ())
462
463
jit_specs .append (gen_trtllm_gen_gemm_module ())
464
+ jit_specs .append (gen_trtllm_low_latency_gemm_module ())
463
465
jit_specs .append (gen_trtllm_gen_fused_moe_sm100_module ())
464
466
if has_sm100f :
465
467
# Add TGV GEMM modules compiled with SM100f flags for both bf16 and fp16
Original file line number Diff line number Diff line change 22
22
gen_gemm_sm100_module ,
23
23
gen_gemm_sm120_module ,
24
24
gen_trtllm_gen_gemm_module ,
25
+ gen_trtllm_low_latency_gemm_module ,
25
26
gen_tgv_gemm_sm10x_module ,
26
27
gen_gemm_sm90_module ,
27
28
)
35
36
"gen_gemm_sm100_module" ,
36
37
"gen_gemm_sm120_module" ,
37
38
"gen_trtllm_gen_gemm_module" ,
39
+ "gen_trtllm_low_latency_gemm_module" ,
38
40
"gen_tgv_gemm_sm10x_module" ,
39
41
"gen_gemm_sm90_module" ,
40
42
"gen_deepgemm_sm100_module" ,
You can’t perform that action at this time.
0 commit comments