|
68 | 68 | from vllm.multimodal import MULTIMODAL_REGISTRY
|
69 | 69 |
|
70 | 70 | from vllm_ascend.models.qwen2_5_vl import AscendQwen2_5_VisionRotaryEmbedding
|
71 |
| -from vllm_ascend.utils import vllm_version_is |
72 | 71 |
|
73 | 72 |
|
74 | 73 | class AscendQwen2_5_VisionAttention_Without_Padding(Qwen2_5_VisionAttention):
|
@@ -484,20 +483,12 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
|
484 | 483 | super().__init__(vllm_config=vllm_config, prefix=prefix)
|
485 | 484 | config: Qwen2_5_VLConfig = vllm_config.model_config.hf_config
|
486 | 485 | quant_config = vllm_config.quant_config
|
487 |
| - if vllm_version_is("0.10.2"): |
488 |
| - self.visual = AscendQwen2_5_VisionTransformer_Without_Padding( |
489 |
| - vision_config=config.vision_config, |
490 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
491 |
| - quant_config=self._maybe_ignore_quant_config(quant_config), |
492 |
| - prefix=maybe_prefix(prefix, "visual"), |
493 |
| - ) |
494 |
| - else: |
495 |
| - self.visual = AscendQwen2_5_VisionTransformer_Without_Padding( |
496 |
| - vision_config=config.vision_config, |
497 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
498 |
| - quant_config=quant_config, |
499 |
| - prefix=maybe_prefix(prefix, "visual"), |
500 |
| - ) |
| 486 | + self.visual = AscendQwen2_5_VisionTransformer_Without_Padding( |
| 487 | + vision_config=config.vision_config, |
| 488 | + norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
| 489 | + quant_config=quant_config, |
| 490 | + prefix=maybe_prefix(prefix, "visual"), |
| 491 | + ) |
501 | 492 |
|
502 | 493 | def _process_image_input(self, image_input) -> tuple[torch.Tensor, ...]:
|
503 | 494 |
|
@@ -563,20 +554,12 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
|
563 | 554 | super().__init__(vllm_config=vllm_config, prefix=prefix)
|
564 | 555 | config: Qwen3VLConfig = vllm_config.model_config.hf_config
|
565 | 556 | quant_config = vllm_config.quant_config
|
566 |
| - if vllm_version_is("0.10.2"): |
567 |
| - self.visual = AscendQwen3_VisionTransformer( |
568 |
| - config.vision_config, |
569 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
570 |
| - quant_config=self._maybe_ignore_quant_config(quant_config), |
571 |
| - prefix=maybe_prefix(prefix, "visual"), |
572 |
| - use_data_parallel=self.use_data_parallel) |
573 |
| - else: |
574 |
| - self.visual = AscendQwen3_VisionTransformer( |
575 |
| - config.vision_config, |
576 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
577 |
| - quant_config=quant_config, |
578 |
| - prefix=maybe_prefix(prefix, "visual"), |
579 |
| - use_data_parallel=self.use_data_parallel) |
| 557 | + self.visual = AscendQwen3_VisionTransformer( |
| 558 | + config.vision_config, |
| 559 | + norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
| 560 | + quant_config=quant_config, |
| 561 | + prefix=maybe_prefix(prefix, "visual"), |
| 562 | + use_data_parallel=self.use_data_parallel) |
580 | 563 |
|
581 | 564 |
|
582 | 565 | @MULTIMODAL_REGISTRY.register_processor(Qwen3VLMultiModalProcessor,
|
@@ -613,19 +596,10 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
|
613 | 596 | multimodal_config = vllm_config.model_config.multimodal_config
|
614 | 597 | self.multimodal_config = multimodal_config
|
615 | 598 | self.use_data_parallel = multimodal_config.mm_encoder_tp_mode == "data"
|
616 |
| - if vllm_version_is("0.10.2"): |
617 |
| - self.visual = AscendQwen3_VisionTransformer( |
618 |
| - config.vision_config, |
619 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
620 |
| - quant_config=self._maybe_ignore_quant_config(quant_config), |
621 |
| - prefix=maybe_prefix(prefix, "visual"), |
622 |
| - use_data_parallel=self.use_data_parallel, |
623 |
| - ) |
624 |
| - else: |
625 |
| - self.visual = AscendQwen3_VisionTransformer( |
626 |
| - config.vision_config, |
627 |
| - norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
628 |
| - quant_config=quant_config, |
629 |
| - prefix=maybe_prefix(prefix, "visual"), |
630 |
| - use_data_parallel=self.use_data_parallel, |
631 |
| - ) |
| 599 | + self.visual = AscendQwen3_VisionTransformer( |
| 600 | + config.vision_config, |
| 601 | + norm_eps=getattr(config, "rms_norm_eps", 1e-6), |
| 602 | + quant_config=quant_config, |
| 603 | + prefix=maybe_prefix(prefix, "visual"), |
| 604 | + use_data_parallel=self.use_data_parallel, |
| 605 | + ) |
0 commit comments