@@ -1237,79 +1237,91 @@ def get_model_tokenizer_qwen1half_intx(model_dir: str,
12371237 'Shanghai_AI_Laboratory/internlm2-math-base-7b' ,
12381238 LoRATM .internlm2 ,
12391239 TemplateType .default_generation_bos ,
1240- support_flash_attn = True )
1240+ support_flash_attn = True ,
1241+ support_vllm = True )
12411242@register_model (
12421243 ModelType .internlm2_math_20b ,
12431244 'Shanghai_AI_Laboratory/internlm2-math-base-20b' ,
12441245 LoRATM .internlm2 ,
12451246 TemplateType .default_generation_bos ,
1246- support_flash_attn = True )
1247+ support_flash_attn = True ,
1248+ support_vllm = True )
12471249@register_model (
12481250 ModelType .internlm2_math_7b_chat ,
12491251 'Shanghai_AI_Laboratory/internlm2-math-7b' ,
12501252 LoRATM .internlm2 ,
12511253 TemplateType .internlm2 ,
12521254 eos_token = '<|im_end|>' ,
1253- support_flash_attn = True )
1255+ support_flash_attn = True ,
1256+ support_vllm = True )
12541257@register_model (
12551258 ModelType .internlm2_math_20b_chat ,
12561259 'Shanghai_AI_Laboratory/internlm2-math-20b' ,
12571260 LoRATM .internlm2 ,
12581261 TemplateType .internlm2 ,
12591262 eos_token = '<|im_end|>' ,
1260- support_flash_attn = True )
1263+ support_flash_attn = True ,
1264+ support_vllm = True )
12611265@register_model (
12621266 ModelType .internlm2_7b_sft_chat ,
12631267 'Shanghai_AI_Laboratory/internlm2-chat-7b-sft' ,
12641268 LoRATM .internlm2 ,
12651269 TemplateType .internlm2 ,
12661270 eos_token = '<|im_end|>' ,
1267- support_flash_attn = True )
1271+ support_flash_attn = True ,
1272+ support_vllm = True )
12681273@register_model (
12691274 ModelType .internlm2_7b_chat ,
12701275 'Shanghai_AI_Laboratory/internlm2-chat-7b' ,
12711276 LoRATM .internlm2 ,
12721277 TemplateType .internlm2 ,
12731278 eos_token = '<|im_end|>' ,
1274- support_flash_attn = True )
1279+ support_flash_attn = True ,
1280+ support_vllm = True )
12751281@register_model (
12761282 ModelType .internlm2_20b_sft_chat ,
12771283 'Shanghai_AI_Laboratory/internlm2-chat-20b-sft' ,
12781284 LoRATM .internlm2 ,
12791285 TemplateType .internlm2 ,
12801286 eos_token = '<|im_end|>' ,
1281- support_flash_attn = True )
1287+ support_flash_attn = True ,
1288+ support_vllm = True )
12821289@register_model (
12831290 ModelType .internlm2_20b_chat ,
12841291 'Shanghai_AI_Laboratory/internlm2-chat-20b' ,
12851292 LoRATM .internlm2 ,
12861293 TemplateType .internlm2 ,
12871294 eos_token = '<|im_end|>' ,
1288- support_flash_attn = True )
1295+ support_flash_attn = True ,
1296+ support_vllm = True )
12891297@register_model (
12901298 ModelType .internlm2_7b ,
12911299 'Shanghai_AI_Laboratory/internlm2-7b' ,
12921300 LoRATM .internlm2 ,
12931301 TemplateType .default_generation_bos ,
1294- support_flash_attn = True )
1302+ support_flash_attn = True ,
1303+ support_vllm = True )
12951304@register_model (
12961305 ModelType .internlm2_7b_base ,
12971306 'Shanghai_AI_Laboratory/internlm2-base-7b' ,
12981307 LoRATM .internlm2 ,
12991308 TemplateType .default_generation_bos ,
1300- support_flash_attn = True )
1309+ support_flash_attn = True ,
1310+ support_vllm = True )
13011311@register_model (
13021312 ModelType .internlm2_20b ,
13031313 'Shanghai_AI_Laboratory/internlm2-20b' ,
13041314 LoRATM .internlm2 ,
13051315 TemplateType .default_generation_bos ,
1306- support_flash_attn = True )
1316+ support_flash_attn = True ,
1317+ support_vllm = True )
13071318@register_model (
13081319 ModelType .internlm2_20b_base ,
13091320 'Shanghai_AI_Laboratory/internlm2-base-20b' ,
13101321 LoRATM .internlm2 ,
13111322 TemplateType .default_generation_bos ,
1312- support_flash_attn = True )
1323+ support_flash_attn = True ,
1324+ support_vllm = True )
13131325def get_model_tokenizer_internlm2 (model_dir : str ,
13141326 torch_dtype : Dtype ,
13151327 model_kwargs : Dict [str , Any ],
0 commit comments