
Commit 563b8ea

fix

1 parent 72bc69f
File tree

2 files changed: +2 -4 lines


lightllm/common/basemodel/layer_weights/meta_weights/fused_moe_weight_ep.py
1 addition, 2 deletions

@@ -360,8 +360,7 @@ def prefilled_group_gemm(
     # here is used to match autotune feature, make moe model run same triton kernel in different rank.
     # in some special case, one rank will recv 0 token, so add a token to make it run triton kernel.
     if (
-        get_triton_autotune_level() != AutotuneLevel.NO_AUTOTUNE
-        and get_triton_autotune_level() != AutotuneLevel.CLOSE_AUTOTUNE
+        get_triton_autotune_level() in [AutotuneLevel.ADAPTIVE_AUTOTUNE, AutotuneLevel.FORCE_AUTOTUNE]
     ):
         _gemm_out_a = torch.zeros((1, N), device=device, dtype=hidden_dtype)
         _silu_out = torch.zeros((1, N // 2), device=device, dtype=hidden_dtype)
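
For context, the rewrite swaps a deny-list for an allow-list. A minimal sketch of the equivalence, assuming AutotuneLevel is an enum with exactly the four members named in this diff (the numeric values here are made up for illustration, not taken from lightllm):

from enum import Enum

# Hypothetical reconstruction of AutotuneLevel for illustration only: the
# commit shows these four member names, but the real enum in lightllm may
# define different values or extra members.
class AutotuneLevel(Enum):
    NO_AUTOTUNE = 0
    CLOSE_AUTOTUNE = 1
    ADAPTIVE_AUTOTUNE = 2
    FORCE_AUTOTUNE = 3

for level in AutotuneLevel:
    # Old condition: deny-list the two levels that disable autotune.
    old = level != AutotuneLevel.NO_AUTOTUNE and level != AutotuneLevel.CLOSE_AUTOTUNE
    # New condition: allow-list the two levels that enable autotune.
    new = level in [AutotuneLevel.ADAPTIVE_AUTOTUNE, AutotuneLevel.FORCE_AUTOTUNE]
    assert old == new  # equivalent while exactly these four levels exist

One behavioral note: under the new allow-list form, any level added to the enum later is treated as autotune-off unless it is explicitly listed.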

lightllm/common/fused_moe/grouped_fused_moe_ep.py
1 addition, 2 deletions

@@ -193,8 +193,7 @@ def fused_experts_impl(
     # here is used to match autotune feature, make moe model run same triton kernel in different rank.
     # in some special case, one rank will recv 0 token, so add a token to make it run triton kernel.
     if (
-        get_triton_autotune_level() != AutotuneLevel.NO_AUTOTUNE
-        and get_triton_autotune_level() != AutotuneLevel.CLOSE_AUTOTUNE
+        get_triton_autotune_level() in [AutotuneLevel.ADAPTIVE_AUTOTUNE, AutotuneLevel.FORCE_AUTOTUNE]
     ):
         _gemm_out_a = torch.zeros((1, N), device=hidden_states.device, dtype=hidden_states.dtype)
         _silu_out = torch.zeros((1, N // 2), device=hidden_states.device, dtype=hidden_states.dtype)
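
The branch both hunks touch exists because, under expert parallelism, a rank can receive zero tokens; if autotuning is active, that rank must still launch the same Triton kernels as its peers so the ranks stay in lockstep. A sketch of the pattern (hypothetical helper name and signature, not lightllm's actual API):

import torch

def ensure_one_token(hidden_states: torch.Tensor, autotune_active: bool) -> torch.Tensor:
    # Hypothetical helper mirroring the pattern in the diff: when autotune
    # is active and this rank received zero tokens, substitute a single
    # zero-filled token so the grouped GEMM / SiLU Triton kernels still
    # launch and every rank takes the same code path.
    if autotune_active and hidden_states.shape[0] == 0:
        return torch.zeros(
            (1, hidden_states.shape[1]),
            device=hidden_states.device,
            dtype=hidden_states.dtype,
        )
    return hidden_states

In the diff itself the dummy buffers are allocated on the output side: _gemm_out_a holds one row of the N-wide GEMM output and _silu_out one row of width N // 2, presumably the gated half produced by the SiLU activation over the fused gate/up projection.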
