|
1 | 1 | SUPPORTED_BASE_MODELS = [ |
2 | | - # qwen1.5 |
3 | | - "Qwen/Qwen1.5-0.5B", |
4 | | - "Qwen/Qwen1.5-0.5B-Chat", |
5 | | - "Qwen/Qwen1.5-1.8B", |
6 | | - "Qwen/Qwen1.5-1.8B-Chat", |
7 | | - "Qwen/Qwen1.5-4B", |
8 | | - "Qwen/Qwen1.5-4B-Chat", |
9 | | - "Qwen/Qwen1.5-7B", |
10 | | - "Qwen/Qwen1.5-7B-Chat", |
11 | | - "Qwen/Qwen1.5-14B", |
12 | | - "Qwen/Qwen1.5-14B-Chat", |
13 | | - "Qwen/Qwen1.5-32B", |
14 | | - "Qwen/Qwen1.5-32B-Chat", |
15 | | - "Qwen/Qwen1.5-72B", |
16 | | - "Qwen/Qwen1.5-72B-Chat", |
17 | | - # qwen2 |
18 | | - "Qwen/Qwen2-0.5B", |
19 | | - "Qwen/Qwen2-0.5B-Instruct", |
20 | | - "Qwen/Qwen2-1.5B", |
21 | | - "Qwen/Qwen2-1.5B-Instruct", |
22 | | - "Qwen/Qwen2-7B", |
23 | | - "Qwen/Qwen2-7B-Instruct", |
24 | | - "Qwen/Qwen2-72B", |
25 | | - "Qwen/Qwen2-72B-Instruct", |
26 | 2 | # qwen2.5 |
27 | 3 | "Qwen/Qwen2.5-0.5B", |
28 | 4 | "Qwen/Qwen2.5-0.5B-Instruct", |
|
38 | 14 | "Qwen/Qwen2.5-32B-Instruct", |
39 | 15 | "Qwen/Qwen2.5-72B", |
40 | 16 | "Qwen/Qwen2.5-72B-Instruct", |
41 | | - # Yi |
42 | | - "01-ai/Yi-6B", |
43 | | - "01-ai/Yi-6B-Chat", |
44 | | - "01-ai/Yi-9B", |
45 | | - "01-ai/Yi-9B-Chat", |
46 | | - "01-ai/Yi-34B", |
47 | | - "01-ai/Yi-34B-Chat", |
48 | 17 | # yi 1.5 |
49 | 18 | "01-ai/Yi-1.5-6B", |
50 | 19 | "01-ai/Yi-1.5-6B-Chat", |
|
53 | 22 | "01-ai/Yi-1.5-34B", |
54 | 23 | "01-ai/Yi-1.5-34B-Chat", |
55 | 24 | # mistral |
56 | | - "mistralai/Mistral-7B-v0.1", |
57 | 25 | "mistralai/Mistral-7B-v0.3", |
58 | | - "mistralai/Mistral-7B-Instruct-v0.1", |
59 | | - "mistralai/Mistral-7B-Instruct-v0.2", |
60 | 26 | "mistralai/Mistral-7B-Instruct-v0.3", |
61 | 27 | "mistralai/Ministral-8B-Instruct-2410", |
62 | | - # mixtral |
63 | | - "mistralai/Mixtral-8x7B-v0.1", |
64 | | - "mistralai/Mixtral-8x7B-Instruct-v0.1", |
65 | | - # gemma |
66 | | - "google/gemma-2b", |
67 | | - "google/gemma-7b", |
68 | | - "google/gemma-2b-it", |
69 | | - "google/gemma-7b-it", |
70 | 28 | # gemma2 |
71 | 29 | "google/gemma-2-2b", |
72 | 30 | "google/gemma-2-9b", |
73 | 31 | "google/gemma-2-27b", |
74 | 32 | "google/gemma-2-2b-it", |
75 | 33 | "google/gemma-2-9b-it", |
76 | 34 | "google/gemma-2-27b-it", |
77 | | - # zephyr |
78 | | - "HuggingFaceH4/zephyr-7b-alpha", |
79 | | - "HuggingFaceH4/zephyr-7b-beta", |
80 | | - # llama2 |
81 | | - "meta-llama/Llama-2-7b-hf", |
82 | | - "meta-llama/Llama-2-13b-hf", |
83 | | - "meta-llama/Llama-2-70b-hf", |
84 | | - "meta-llama/Llama-2-7b-chat-hf", |
85 | | - "meta-llama/Llama-2-13b-chat-hf", |
86 | | - "meta-llama/Llama-2-70b-chat-hf", |
87 | 35 | # llama3 |
88 | 36 | "meta-llama/Meta-Llama-3-8B", |
89 | 37 | "meta-llama/Meta-Llama-3-8B-Instruct", |
|
101 | 49 | # phi4 |
102 | 50 | "microsoft/Phi-4-mini-instruct", |
103 | 51 | "microsoft/phi-4", |
104 | | - # deepseek |
105 | | - "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", |
106 | | - "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", |
107 | | - "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", |
108 | | - "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", |
109 | | - "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", |
110 | | - "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", |
111 | 52 | ] |
0 commit comments