Skip to content
This repository was archived by the owner on Sep 4, 2025. It is now read-only.

Commit 4bb98f2

Browse files
authored
[Misc] Update config loading for Qwen2-VL and remove Granite (vllm-project#8837)
1 parent 7193774 commit 4bb98f2

File tree

7 files changed, with 144 additions and 224 deletions.

docs/source/models/supported_models.rst

Lines changed: 1 addition & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -280,7 +280,7 @@ Multimodal Language Models
280280
- :code:`Qwen/Qwen-VL`, :code:`Qwen/Qwen-VL-Chat`, etc.
281281
-
282282
* - :code:`Qwen2VLForConditionalGeneration`
283-
- Qwen2-VL (see note)
283+
- Qwen2-VL
284284
- Image\ :sup:`+` / Video\ :sup:`+`
285285
- :code:`Qwen/Qwen2-VL-2B-Instruct`, :code:`Qwen/Qwen2-VL-7B-Instruct`, :code:`Qwen/Qwen2-VL-72B-Instruct`, etc.
286286
-
@@ -297,15 +297,6 @@ Multimodal Language Models
297297
For :code:`openbmb/MiniCPM-V-2`, the official repo doesn't work yet, so we need to use a fork (:code:`HwwwH/MiniCPM-V-2`) for now.
298298
For more details, please see: https://github.com/vllm-project/vllm/pull/4087#issuecomment-2250397630
299299

300-
.. note::
301-
For :code:`Qwen2-VL`, the latest release of :code:`huggingface/transformers` doesn't work yet, so we need to use a developer version (:code:`21fac7abba2a37fae86106f87fcf9974fd1e3830`) for now.
302-
This can be installed by running the following command:
303-
304-
.. code-block:: bash
305-
306-
pip install git+https://github.com/huggingface/transformers.git@21fac7abba2a37fae86106f87fcf9974fd1e3830
307-
308-
----
309300

310301
If your model uses one of the above model architectures, you can seamlessly run your model with vLLM.
311302
Otherwise, please refer to :ref:`Adding a New Model <adding_a_new_model>` and :ref:`Enabling Multimodal Inputs <enabling_multimodal_inputs>`

vllm/model_executor/models/granite.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@
2525

2626
import torch
2727
from torch import nn
28+
from transformers import GraniteConfig
2829

2930
from vllm.attention import Attention, AttentionMetadata
3031
from vllm.config import CacheConfig, LoRAConfig
@@ -48,7 +49,6 @@
4849
default_weight_loader, kv_cache_scales_loader, maybe_remap_kv_scale_name)
4950
from vllm.model_executor.sampling_metadata import SamplingMetadata
5051
from vllm.sequence import IntermediateTensors
51-
from vllm.transformers_utils.configs.granite import GraniteConfig
5252
from vllm.utils import is_hip
5353

5454
from .interfaces import SupportsLoRA

vllm/model_executor/models/qwen2_vl.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -31,12 +31,9 @@
3131
import torch.nn.functional as F
3232
from einops import rearrange, repeat
3333
from PIL import Image
34-
from transformers import Qwen2VLConfig
3534
from transformers.image_utils import (get_image_size,
3635
infer_channel_dimension_format,
3736
to_numpy_array)
38-
from transformers.models.qwen2_vl.configuration_qwen2_vl import (
39-
Qwen2VLVisionConfig)
4037
from transformers.models.qwen2_vl.image_processing_qwen2_vl import (
4138
make_batched_images, make_batched_videos, smart_resize)
4239

@@ -66,6 +63,8 @@
6663
from vllm.multimodal.image import cached_get_image_processor
6764
from vllm.platforms import current_platform
6865
from vllm.sequence import IntermediateTensors, SequenceData
66+
from vllm.transformers_utils.configs.qwen2vl import (Qwen2VLConfig,
67+
Qwen2VLVisionConfig)
6968
from vllm.transformers_utils.processor import get_processor
7069
from vllm.utils import is_cpu
7170

vllm/transformers_utils/config.py

Lines changed: 5 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -20,10 +20,10 @@
2020
# yapf: disable
2121
from vllm.transformers_utils.configs import (ChatGLMConfig, DbrxConfig,
2222
EAGLEConfig, ExaoneConfig,
23-
GraniteConfig, InternVLChatConfig,
24-
JAISConfig, MedusaConfig,
25-
MllamaConfig, MLPSpeculatorConfig,
26-
MPTConfig, NemotronConfig,
23+
InternVLChatConfig, JAISConfig,
24+
MedusaConfig, MllamaConfig,
25+
MLPSpeculatorConfig, MPTConfig,
26+
NemotronConfig, Qwen2VLConfig,
2727
RWConfig, SolarConfig,
2828
UltravoxConfig)
2929
# yapf: enable
@@ -57,9 +57,7 @@
5757
"nemotron": NemotronConfig,
5858
"solar": SolarConfig,
5959
"ultravox": UltravoxConfig,
60-
# Granite can be removed from here once we have upgraded to
61-
# transformers 4.45+
62-
"granite": GraniteConfig,
60+
"qwen2_vl": Qwen2VLConfig,
6361
**_CONFIG_REGISTRY_OVERRIDE_HF
6462
}
6563

vllm/transformers_utils/configs/__init__.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -6,14 +6,15 @@
66
# tiiuae/falcon-7b(-instruct) models. Newer Falcon models will use the
77
# `FalconConfig` class from the official HuggingFace transformers library.
88
from vllm.transformers_utils.configs.falcon import RWConfig
9-
from vllm.transformers_utils.configs.granite import GraniteConfig
109
from vllm.transformers_utils.configs.internvl import InternVLChatConfig
1110
from vllm.transformers_utils.configs.jais import JAISConfig
1211
from vllm.transformers_utils.configs.medusa import MedusaConfig
1312
from vllm.transformers_utils.configs.mllama import MllamaConfig
1413
from vllm.transformers_utils.configs.mlp_speculator import MLPSpeculatorConfig
1514
from vllm.transformers_utils.configs.mpt import MPTConfig
1615
from vllm.transformers_utils.configs.nemotron import NemotronConfig
16+
from vllm.transformers_utils.configs.qwen2vl import (Qwen2VLConfig,
17+
Qwen2VLVisionConfig)
1718
from vllm.transformers_utils.configs.solar import SolarConfig
1819
from vllm.transformers_utils.configs.ultravox import UltravoxConfig
1920

@@ -32,7 +33,6 @@
3233
"NemotronConfig",
3334
"SolarConfig",
3435
"UltravoxConfig",
35-
# Granite can be removed from here once we have upgraded to
36-
# transformers 4.45+
37-
"GraniteConfig",
36+
"Qwen2VLConfig",
37+
"Qwen2VLVisionConfig",
3838
]

vllm/transformers_utils/configs/granite.py

Lines changed: 0 additions & 199 deletions
This file was deleted.

0 commit comments

Comments
 (0)