File tree Expand file tree Collapse file tree 2 files changed +12
-1
lines changed Expand file tree Collapse file tree 2 files changed +12
-1
lines changed Original file line number Diff line number Diff line change 25
25
as_reward_model ,
26
26
as_seq_cls_model )
27
27
from vllm .model_executor .models .interfaces import SupportsQuant
28
- from vllm .model_executor .models .registry import _TRANSFORMERS_MODELS
28
+ from vllm .model_executor .models .registry import (_PREVIOUSLY_SUPPORTED_MODELS ,
29
+ _TRANSFORMERS_MODELS )
29
30
from vllm .utils import is_pin_memory_available
30
31
31
32
logger = init_logger (__name__ )
@@ -261,6 +262,14 @@ def get_model_architecture(
261
262
vllm_not_supported = False
262
263
break
263
264
265
+ if any (arch in _PREVIOUSLY_SUPPORTED_MODELS for arch in architectures ):
266
+ previous_version = _PREVIOUSLY_SUPPORTED_MODELS [architectures [0 ]]
267
+ raise ValueError (
268
+ f"Model architecture { architectures [0 ]} was supported"
269
+ f" in vLLM until version { previous_version } , and is "
270
+ "not supported anymore. Please use an older version"
271
+ " of vLLM if you want to use this model architecture." )
272
+
264
273
if (model_config .model_impl == ModelImpl .TRANSFORMERS or
265
274
model_config .model_impl == ModelImpl .AUTO and vllm_not_supported ):
266
275
architectures = resolve_transformers_arch (model_config , architectures )
Original file line number Diff line number Diff line change 276
276
sys .executable , "-m" , "vllm.model_executor.models.registry"
277
277
]
278
278
279
+ _PREVIOUSLY_SUPPORTED_MODELS = {"Phi3SmallForCausalLM" : "0.9.2" }
280
+
279
281
280
282
@dataclass (frozen = True )
281
283
class _ModelInfo :
You can’t perform that action at this time.
0 commit comments