xorbitsai
diff --git a/doc/source/gen_docs.py b/doc/source/gen_docs.py
Lines changed: 2 additions & 2 deletions
diff --git a/xinference/model/llm/__init__.py b/xinference/model/llm/__init__.py
Lines changed: 2 additions & 2 deletions
@@ -81,8 +81,8 @@ def mock_platform_checks():
     vllm_core.VLLMModel._has_cuda_device = lambda: True
     vllm_core.VLLMChatModel._is_linux = lambda: True
     vllm_core.VLLMChatModel._has_cuda_device = lambda: True
-    vllm_core.VLLMVisionModel._is_linux = lambda: True
-    vllm_core.VLLMVisionModel._has_cuda_device = lambda: True
+    vllm_core.VLLMMultiModel._is_linux = lambda: True
+    vllm_core.VLLMMultiModel._has_cuda_device = lambda: True
 
     # Mock SGLang platform checks if available
     try:
 
@@ -179,12 +179,12 @@ def _install():
     from .mlx.core import MLXChatModel, MLXModel, MLXVisionModel
     from .sglang.core import SGLANGChatModel, SGLANGModel, SGLANGVisionModel
     from .transformers.core import PytorchChatModel, PytorchModel
-    from .vllm.core import VLLMChatModel, VLLMModel, VLLMVisionModel
+    from .vllm.core import VLLMChatModel, VLLMModel, VLLMMultiModel
 
     # register llm classes.
     LLAMA_CLASSES.extend([XllamaCppModel])
     SGLANG_CLASSES.extend([SGLANGModel, SGLANGChatModel, SGLANGVisionModel])
-    VLLM_CLASSES.extend([VLLMModel, VLLMChatModel, VLLMVisionModel])
+    VLLM_CLASSES.extend([VLLMModel, VLLMChatModel, VLLMMultiModel])
     MLX_CLASSES.extend([MLXModel, MLXChatModel, MLXVisionModel])
     LMDEPLOY_CLASSES.extend([LMDeployModel, LMDeployChatModel])
     TRANSFORMERS_CLASSES.extend([PytorchChatModel, PytorchModel])