Skip to content

Commit 553b95e

Browse files
committed
minor
1 parent 32433d1 commit 553b95e

File tree

1 file changed

+10
-3
lines changed

1 file changed

+10
-3
lines changed

flashinfer/fused_moe/core.py

Lines changed: 10 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1082,6 +1082,8 @@ def forward(
10821082
local_expert_offset: int,
10831083
routed_scaling_factor: Optional[float],
10841084
routing_method_type: int,
1085+
enable_pdl: bool,
1086+
do_finalize: bool,
10851087
tactic: int = -1,
10861088
do_preparation: bool = False,
10871089
):
@@ -1154,7 +1156,8 @@ def forward(
11541156
routed_scaling_factor,
11551157
tile_tokens_dim,
11561158
routing_method_type,
1157-
True, # do_finalize
1159+
enable_pdl,
1160+
do_finalize,
11581161
output,
11591162
tactic,
11601163
)
@@ -1476,6 +1479,8 @@ def trtllm_fp4_block_scale_moe_op(
14761479
local_expert_offset=local_expert_offset,
14771480
routed_scaling_factor=routed_scaling_factor,
14781481
routing_method_type=routing_method_type,
1482+
enable_pdl=enable_pdl,
1483+
do_finalize=do_finalize,
14791484
)
14801485

14811486
# Call the C++ function for block scale MoE
@@ -1547,8 +1552,9 @@ def _fake_trtllm_fp4_block_scale_moe(
15471552
tile_tokens_dim: int,
15481553
routing_method_type: int,
15491554
do_finalize: bool,
1550-
enable_pdl: Optional[bool] = None,
1551-
output: Optional[torch.Tensor] = None,
1555+
enable_pdl: bool,
1556+
tune_max_num_tokens: int,
1557+
output: Optional[torch.Tensor],
15521558
):
15531559
seq_len = hidden_states.shape[0]
15541560
hidden_size = hidden_states.shape[1]
@@ -1789,6 +1795,7 @@ def trtllm_fp4_block_scale_moe(
17891795
List[torch.Tensor]: List of output tensors. If do_finalize=True, returns the final MoE output.
17901796
Otherwise, returns intermediate results (gemm2_output, expert_weights, expanded_idx_to_permuted_idx) that need further processing.
17911797
"""
1798+
print(f"in trtllm_fp4_block_scale_moe, tune_max_num_tokens={tune_max_num_tokens}")
17921799
return get_trtllm_moe_sm100_module().trtllm_fp4_block_scale_moe(
17931800
routing_logits,
17941801
None,

0 commit comments

Comments
 (0)