forked from lm-playpen/playpen
-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy path model_registry.json
More file actions
118 lines (118 loc) · 3.42 KB
/
model_registry.json
File metadata and controls
118 lines (118 loc) · 3.42 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
[
{
"model_name": "smol-135m",
"backend": "huggingface_local",
"huggingface_id": "HuggingFaceTB/SmolLM-135M-Instruct",
"release_date": "2024-09-04",
"open_weight": true,
"parameters": "135M",
"languages": ["en"],
"context_size": "2048",
"license": {
"name": "Apache 2.0",
"url": "https://www.apache.org/licenses/LICENSE-2.0"
},
"model_config": {
"premade_chat_template": true,
"eos_to_cull": "<\\|im_end\\|>"
}
}, {
"model_name": "smol-135m-sft",
"backend": "huggingface_local",
"huggingface_id": "models/sft/smol-135m/checkpoint-63",
"release_date": "2024-09-04",
"open_weight": true,
"parameters": "135M",
"languages": ["en"],
"context_size": "2048",
"license": {
"name": "Apache 2.0",
"url": "https://www.apache.org/licenses/LICENSE-2.0"
},
"model_config": {
"premade_chat_template": true,
"eos_to_cull": "<\\|im_end\\|>"
}
}, {
"model_name": "Llama-3.1-8B-Instruct",
"backend": "huggingface_local",
"huggingface_id": "meta-llama/Meta-Llama-3.1-8B-Instruct",
"release_date": "2024-07-23",
"open_weight": true,
"parameters": "8B",
"languages": ["en", "de", "fr", "it", "pt", "hi", "es", "th"],
"context_size": "128k",
"license": {
"name": "Meta",
"url": "https://github.com/meta-llama/llama-models/blob/main/models/llama3_1/LICENSE"
},
"model_config": {
"requires_api_key": true,
"premade_chat_template": true,
"eos_to_cull": "<\\|eot_id\\|>"
}
}, {
"model_name": "Llama-3.1-8B-Instruct-4bit",
"backend": "huggingface_local",
"huggingface_id": "meta-llama/Meta-Llama-3.1-8B-Instruct",
"release_date": "2024-07-23",
"open_weight": true,
"parameters": "8B",
"languages": ["en", "de", "fr", "it", "pt", "hi", "es", "th"],
"context_size": "128k",
"license": {
"name": "Meta",
"url": "https://github.com/meta-llama/llama-models/blob/main/models/llama3_1/LICENSE"
},
"model_config": {
"requires_api_key": true,
"premade_chat_template": true,
"eos_to_cull": "<\\|eot_id\\|>",
"load_in_4bit": true
}
}, {
"model_name": "llama3-8b-sft",
"backend": "huggingface_local",
"huggingface_id": "meta-llama/Meta-Llama-3.1-8B-Instruct",
"release_date": "2024-07-23",
"open_weight": true,
"parameters": "8B",
"languages": ["en", "de", "fr", "it", "pt", "hi", "es", "th"],
"context_size": "128k",
"license": {
"name": "Meta",
"url": "https://github.com/meta-llama/llama-models/blob/main/models/llama3_1/LICENSE"
},
"model_config": {
"peft_model": "models/sft+lora/llama3-8b/checkpoint-78",
"requires_api_key": true,
"premade_chat_template": true,
"eos_to_cull": "<\\|eot_id\\|>"
}
}, {
"model_name": "gpt4o-mini",
"model_id": "gpt-4o-mini-2024-07-18",
"backend": "openai",
"release_date": "2024-07-18",
"open_weight": false,
"parameters": "",
"languages": [
"en", "es", "fr", "de", "it", "pt", "ru", "zh", "ja", "ko", "ar", "hi", "bn", "te", "ta", "ml", "kn", "gu", "mr",
"pa", "ur", "vi", "th", "id", "ms", "tl", "sw", "yo", "zu", "tr", "he", "fa", "uk", "pl", "cs", "hu", "ro", "nl",
"sv", "no", "da", "fi", "el", "bg", "sr", "hr", "sk", "is"
],
"context_size": "128k",
"license": {
"name": "OpenAI",
"url": "https://openai.com/policies/row-terms-of-use/"
},
"model_config": {
"multimodality": {
"single_image": true,
"multiple_images": true,
"audio": false,
"video": false
}
}
}
]