11{
2- "DeepSeek-R1-Distill-Qwen-1.5B" : {
3- "url" : " https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B.git" ,
4- "tensor_parallel_size" : 1
2+ "deepseek-r1-distill-qwen-1.5b" : {
3+ "name" : " deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B" ,
4+ "modelscope_url" : " https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B.git" ,
5+ "huggingface_url" : " https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B" ,
6+ "tensor_parallel_size" : [1 ]
57 },
6- "Qwen2.5-0.5B-Instruct" : {
7- "url" : " https://www.modelscope.cn/Qwen/Qwen2.5-0.5B-Instruct.git" ,
8- "tensor_parallel_size" : 1
8+
9+ "deepseek-r1-distill-llama-70b" : {
10+ "name" : " deepseek-ai/DeepSeek-R1-Distill-Llama-70B" ,
11+ "modelscope_url" : " https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Llama-70B.git" ,
12+ "huggingface_url" : " https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-70B" ,
13+ "tensor_parallel_size" : [4 , 8 ]
14+ },
15+
16+ "deepseek-r1-distill-qwen-32b" : {
17+ "name" : " deepseek-ai/DeepSeek-R1-Distill-Qwen-32B" ,
18+ "modelscope_url" : " https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B.git" ,
19+ "huggingface_url" : " https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B" ,
20+ "tensor_parallel_size" : [2 , 4 ]
21+ },
22+
23+ "qwen2.5-0.5b-instruct" : {
24+ "name" : " Qwen/Qwen2.5-0.5B-Instruct" ,
25+ "modelscope_url" : " https://www.modelscope.cn/Qwen/Qwen2.5-0.5B-Instruct.git" ,
26+ "huggingface_url" : " https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct" ,
27+ "tensor_parallel_size" : [1 ]
928 }
10- }
29+ }
0 commit comments