4 files changed: +342 -125 lines changed
Original file line number | Diff line number | Diff line change
@@ -324,6 +324,8 @@ class FusedMoEConfig:
324
324
325
325
max_num_tokens : int = envs .VLLM_MOE_DP_CHUNK_SIZE
326
326
327
+ has_bias : bool = False
328
+
327
329
def __post_init__ (self ):
328
330
if self .dp_size > 1 :
329
331
logger .debug_once ("Using FusedMoEConfig::max_num_tokens=%d" ,
@@ -413,7 +415,8 @@ def make(
413
415
in_dtype : torch .dtype ,
414
416
max_num_tokens : int = envs .VLLM_MOE_DP_CHUNK_SIZE ,
415
417
quant_config : Optional [Union [FusedMoEQuantConfig ,
416
- QuantizationConfig ]] = None
418
+ QuantizationConfig ]] = None ,
419
+ has_bias : bool = False ,
417
420
) -> "FusedMoEConfig" :
418
421
419
422
_quant_config : Optional [FusedMoEQuantConfig ] = None
@@ -482,4 +485,5 @@ def make(
482
485
in_dtype = in_dtype ,
483
486
quant_config = _quant_config ,
484
487
max_num_tokens = max_num_tokens ,
488
+ has_bias = has_bias ,
485
489
)
You can’t perform that action at this time.
0 commit comments