68
68
from vllm .multimodal import MULTIMODAL_REGISTRY
69
69
70
70
from vllm_ascend .models .qwen2_5_vl import AscendQwen2_5_VisionRotaryEmbedding
71
+ from vllm_ascend .utils import vllm_version_is
71
72
72
73
73
74
class AscendQwen2_5_VisionAttention_Without_Padding (Qwen2_5_VisionAttention ):
@@ -483,12 +484,20 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
483
484
super ().__init__ (vllm_config = vllm_config , prefix = prefix )
484
485
config : Qwen2_5_VLConfig = vllm_config .model_config .hf_config
485
486
quant_config = vllm_config .quant_config
486
- self .visual = AscendQwen2_5_VisionTransformer_Without_Padding (
487
- vision_config = config .vision_config ,
488
- norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
489
- quant_config = self ._maybe_ignore_quant_config (quant_config ),
490
- prefix = maybe_prefix (prefix , "visual" ),
491
- )
487
+ if vllm_version_is ("0.10.2" ):
488
+ self .visual = AscendQwen2_5_VisionTransformer_Without_Padding (
489
+ vision_config = config .vision_config ,
490
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
491
+ quant_config = self ._maybe_ignore_quant_config (quant_config ),
492
+ prefix = maybe_prefix (prefix , "visual" ),
493
+ )
494
+ else :
495
+ self .visual = AscendQwen2_5_VisionTransformer_Without_Padding (
496
+ vision_config = config .vision_config ,
497
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
498
+ quant_config = self .quant_config ,
499
+ prefix = maybe_prefix (prefix , "visual" ),
500
+ )
492
501
493
502
def _process_image_input (self , image_input ) -> tuple [torch .Tensor , ...]:
494
503
@@ -554,12 +563,20 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
554
563
super ().__init__ (vllm_config = vllm_config , prefix = prefix )
555
564
config : Qwen3VLConfig = vllm_config .model_config .hf_config
556
565
quant_config = vllm_config .quant_config
557
- self .visual = AscendQwen3_VisionTransformer (
558
- config .vision_config ,
559
- norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
560
- quant_config = self ._maybe_ignore_quant_config (quant_config ),
561
- prefix = maybe_prefix (prefix , "visual" ),
562
- use_data_parallel = self .use_data_parallel )
566
+ if vllm_version_is ("0.10.2" ):
567
+ self .visual = AscendQwen3_VisionTransformer (
568
+ config .vision_config ,
569
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
570
+ quant_config = self ._maybe_ignore_quant_config (quant_config ),
571
+ prefix = maybe_prefix (prefix , "visual" ),
572
+ use_data_parallel = self .use_data_parallel )
573
+ else :
574
+ self .visual = AscendQwen3_VisionTransformer (
575
+ config .vision_config ,
576
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
577
+ quant_config = self .quant_config ,
578
+ prefix = maybe_prefix (prefix , "visual" ),
579
+ use_data_parallel = self .use_data_parallel )
563
580
564
581
565
582
@MULTIMODAL_REGISTRY .register_processor (Qwen3VLMultiModalProcessor ,
@@ -596,11 +613,19 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
596
613
multimodal_config = vllm_config .model_config .multimodal_config
597
614
self .multimodal_config = multimodal_config
598
615
self .use_data_parallel = multimodal_config .mm_encoder_tp_mode == "data"
599
-
600
- self .visual = AscendQwen3_VisionTransformer (
601
- config .vision_config ,
602
- norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
603
- quant_config = self ._maybe_ignore_quant_config (quant_config ),
604
- prefix = maybe_prefix (prefix , "visual" ),
605
- use_data_parallel = self .use_data_parallel ,
606
- )
616
+ if vllm_version_is ("0.10.2" ):
617
+ self .visual = AscendQwen3_VisionTransformer (
618
+ config .vision_config ,
619
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
620
+ quant_config = self ._maybe_ignore_quant_config (quant_config ),
621
+ prefix = maybe_prefix (prefix , "visual" ),
622
+ use_data_parallel = self .use_data_parallel ,
623
+ )
624
+ else :
625
+ self .visual = AscendQwen3_VisionTransformer (
626
+ config .vision_config ,
627
+ norm_eps = getattr (config , "rms_norm_eps" , 1e-6 ),
628
+ quant_config = self .quant_config ,
629
+ prefix = maybe_prefix (prefix , "visual" ),
630
+ use_data_parallel = self .use_data_parallel ,
631
+ )
0 commit comments