We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent be1a8e5 · commit 916f902 · Copy full SHA for 916f902
vllm/model_executor/layers/fused_moe/fused_moe.py
@@ -765,7 +765,7 @@ def get_default_config(
765
# num_stages=3 can cause triton.runtime.errors.OutOfResources
766
# on ROCm, set it to 2 instead.
767
config = {
768
- "BLOCK_SIZE_M": 64 if not use_deep_gemm else dg.get_m_alignment_for_contiguous_layout(),
+ "BLOCK_SIZE_M": 64,
769
"BLOCK_SIZE_N": block_shape[0],
770
"BLOCK_SIZE_K": block_shape[1],
771
"GROUP_SIZE_M": 32,
0 commit comments