File tree Expand file tree Collapse file tree 1 file changed +3
-2
lines changed
vllm/model_executor/layers/fused_moe Expand file tree Collapse file tree 1 file changed +3
-2
lines changed Original file line number Diff line number Diff line change @@ -835,15 +835,16 @@ def __init__(
835
835
836
836
if quant_config is None :
837
837
quant_method = UnquantizedFusedMoEMethod (moe )
838
+ prepare_finalize = _construct_prepare_finalize (moe , quant_config )
838
839
else :
839
840
quant_method = quant_config .get_quant_method (self , prefix )
841
+ # No pplx for quantized types yet.
842
+ prepare_finalize = None
840
843
841
844
assert quant_method is not None
842
845
assert isinstance (quant_method , FusedMoEMethodBase )
843
846
self .quant_method = quant_method
844
847
845
- prepare_finalize = _construct_prepare_finalize (moe , quant_config )
846
-
847
848
if prepare_finalize is not None :
848
849
world_size = moe .ep_size
849
850
dp_size = int (moe .ep_size // moe .dp_size )
You can’t perform that action at this time.
0 commit comments