Skip to content

Commit 0287d9a

Browse files
zhcn000000 authored and OliverBryant committed
FEAT: Add vllm multi model support (#4126)
1 parent 2a82544 commit 0287d9a

File tree

5 files changed

+224
-54
lines changed

5 files changed

+224
-54
lines changed

doc/source/gen_docs.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -81,8 +81,8 @@ def mock_platform_checks():
8181
vllm_core.VLLMModel._has_cuda_device = lambda: True
8282
vllm_core.VLLMChatModel._is_linux = lambda: True
8383
vllm_core.VLLMChatModel._has_cuda_device = lambda: True
84-
vllm_core.VLLMVisionModel._is_linux = lambda: True
85-
vllm_core.VLLMVisionModel._has_cuda_device = lambda: True
84+
vllm_core.VLLMMultiModel._is_linux = lambda: True
85+
vllm_core.VLLMMultiModel._has_cuda_device = lambda: True
8686

8787
# Mock SGLang platform checks if available
8888
try:

xinference/model/llm/__init__.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -179,12 +179,12 @@ def _install():
179179
from .mlx.core import MLXChatModel, MLXModel, MLXVisionModel
180180
from .sglang.core import SGLANGChatModel, SGLANGModel, SGLANGVisionModel
181181
from .transformers.core import PytorchChatModel, PytorchModel
182-
from .vllm.core import VLLMChatModel, VLLMModel, VLLMVisionModel
182+
from .vllm.core import VLLMChatModel, VLLMModel, VLLMMultiModel
183183

184184
# register llm classes.
185185
LLAMA_CLASSES.extend([XllamaCppModel])
186186
SGLANG_CLASSES.extend([SGLANGModel, SGLANGChatModel, SGLANGVisionModel])
187-
VLLM_CLASSES.extend([VLLMModel, VLLMChatModel, VLLMVisionModel])
187+
VLLM_CLASSES.extend([VLLMModel, VLLMChatModel, VLLMMultiModel])
188188
MLX_CLASSES.extend([MLXModel, MLXChatModel, MLXVisionModel])
189189
LMDEPLOY_CLASSES.extend([LMDeployModel, LMDeployChatModel])
190190
TRANSFORMERS_CLASSES.extend([PytorchChatModel, PytorchModel])

0 commit comments

Comments
 (0)