-
Notifications
You must be signed in to change notification settings - Fork 40
Expand file tree
/
Copy pathmodel_registry.cpp
More file actions
111 lines (96 loc) · 4.21 KB
/
model_registry.cpp
File metadata and controls
111 lines (96 loc) · 4.21 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
#include "model_registry.h"
#include <glog/logging.h>
// list all registered models here
#include "huggingface/aquila.h" // IWYU pragma: keep
#include "huggingface/baichuan.h" // IWYU pragma: keep
#include "huggingface/bloom.h" // IWYU pragma: keep
#include "huggingface/chatglm.h" // IWYU pragma: keep
#include "huggingface/gemma.h" // IWYU pragma: keep
#include "huggingface/gpt2.h" // IWYU pragma: keep
#include "huggingface/gpt_j.h" // IWYU pragma: keep
#include "huggingface/gpt_neox.h" // IWYU pragma: keep
#include "huggingface/internlm.h" // IWYU pragma: keep
#include "huggingface/llama.h" // IWYU pragma: keep
#include "huggingface/mistral.h" // IWYU pragma: keep
#include "huggingface/mixtral.h" // IWYU pragma: keep
#include "huggingface/mpt.h" // IWYU pragma: keep
#include "huggingface/phi.h" // IWYU pragma: keep
#include "huggingface/qwen.h" // IWYU pragma: keep
#include "huggingface/yi.h" // IWYU pragma: keep
#include "llama.h" // IWYU pragma: keep
namespace llm {
// Returns the single shared registry instance.
// The instance is a function-local static, so it is constructed on the first
// call and the same pointer is returned by every call.
ModelRegistry* ModelRegistry::get_instance() {
  static ModelRegistry registry;
  return &registry;
}
// Registers the causal LM factory for the model called `name`.
// The first registration wins: if a factory is already stored for `name`, a
// warning is logged and the existing factory is left untouched.
void ModelRegistry::register_causallm_factory(const std::string& name,
                                              CausalLMFactory factory) {
  // Index the registry once and keep a reference to the slot instead of
  // repeating the lookup for the check and the assignment.
  auto& slot = get_instance()->model_registry_[name].causal_lm_factory;
  if (slot != nullptr) {
    LOG(WARNING) << "causal lm factory for " << name << " already registered.";
    return;
  }
  slot = factory;
}
// Registers the model-args loader for the model called `name`.
// The first registration wins: if a loader is already stored for `name`, a
// warning is logged and the existing loader is left untouched.
void ModelRegistry::register_model_args_loader(const std::string& name,
                                               ModelArgsLoader loader) {
  // Index the registry once and keep a reference to the slot instead of
  // repeating the lookup for the check and the assignment.
  auto& slot = get_instance()->model_registry_[name].model_args_loader;
  if (slot != nullptr) {
    LOG(WARNING) << "model args loader for " << name << " already registered.";
    return;
  }
  slot = loader;
}
// Registers the quantization-args loader for the model called `name`.
// The first registration wins: if a loader is already stored for `name`, a
// warning is logged and the existing loader is left untouched.
void ModelRegistry::register_quant_args_loader(const std::string& name,
                                               QuantArgsLoader loader) {
  // Index the registry once and keep a reference to the slot instead of
  // repeating the lookup for the check and the assignment.
  auto& slot = get_instance()->model_registry_[name].quant_args_loader;
  if (slot != nullptr) {
    LOG(WARNING) << "quant args loader for " << name << " already registered.";
    return;
  }
  slot = loader;
}
// Registers the tokenizer-args loader for the model called `name`.
// The first registration wins: if a loader is already stored for `name`, a
// warning is logged and the existing loader is left untouched.
void ModelRegistry::register_tokenizer_args_loader(const std::string& name,
                                                   TokenizerArgsLoader loader) {
  // Index the registry once and keep a reference to the slot instead of
  // repeating the lookup for the check and the assignment.
  auto& slot = get_instance()->model_registry_[name].tokenizer_args_loader;
  if (slot != nullptr) {
    LOG(WARNING) << "tokenizer args loader for " << name
                 << " already registered.";
    return;
  }
  slot = loader;
}
// Registers the default chat (conversation) template factory for the model
// called `name`.
// The first registration wins: if a factory is already stored for `name`, a
// warning is logged and the existing factory is left untouched.
void ModelRegistry::register_default_chat_template_factory(
    const std::string& name,
    ChatTemplateFactory factory) {
  // Index the registry once and keep a reference to the slot instead of
  // repeating the lookup for the check and the assignment.
  auto& slot = get_instance()->model_registry_[name].chat_template_factory;
  if (slot != nullptr) {
    LOG(WARNING) << "conversation template for " << name
                 << " already registered.";
    return;
  }
  slot = factory;
}
// Returns the causal LM factory registered for `name`, or a null factory if
// nothing has been registered under that name.
CausalLMFactory ModelRegistry::get_causallm_factory(const std::string& name) {
  // Use find() rather than operator[] so that querying an unknown model does
  // not insert an empty entry into the registry.
  // NOTE(review): assumes model_registry_ is a std::map/std::unordered_map
  // keyed by model name - confirm against model_registry.h.
  const auto& registry = get_instance()->model_registry_;
  const auto it = registry.find(name);
  if (it == registry.end()) {
    return nullptr;
  }
  return it->second.causal_lm_factory;
}
// Returns the model-args loader registered for `name`, or a null loader if
// nothing has been registered under that name.
ModelArgsLoader ModelRegistry::get_model_args_loader(const std::string& name) {
  // Use find() rather than operator[] so that querying an unknown model does
  // not insert an empty entry into the registry.
  // NOTE(review): assumes model_registry_ is a std::map/std::unordered_map
  // keyed by model name - confirm against model_registry.h.
  const auto& registry = get_instance()->model_registry_;
  const auto it = registry.find(name);
  if (it == registry.end()) {
    return nullptr;
  }
  return it->second.model_args_loader;
}
// Returns the quantization-args loader registered for `name`, or a null loader
// if nothing has been registered under that name.
QuantArgsLoader ModelRegistry::get_quant_args_loader(const std::string& name) {
  // Use find() rather than operator[] so that querying an unknown model does
  // not insert an empty entry into the registry.
  // NOTE(review): assumes model_registry_ is a std::map/std::unordered_map
  // keyed by model name - confirm against model_registry.h.
  const auto& registry = get_instance()->model_registry_;
  const auto it = registry.find(name);
  if (it == registry.end()) {
    return nullptr;
  }
  return it->second.quant_args_loader;
}
// Returns the tokenizer-args loader registered for `name`, or a null loader if
// nothing has been registered under that name.
TokenizerArgsLoader ModelRegistry::get_tokenizer_args_loader(
    const std::string& name) {
  // Use find() rather than operator[] so that querying an unknown model does
  // not insert an empty entry into the registry.
  // NOTE(review): assumes model_registry_ is a std::map/std::unordered_map
  // keyed by model name - confirm against model_registry.h.
  const auto& registry = get_instance()->model_registry_;
  const auto it = registry.find(name);
  if (it == registry.end()) {
    return nullptr;
  }
  return it->second.tokenizer_args_loader;
}
// Returns the default chat template factory registered for `name`, or a null
// factory if nothing has been registered under that name.
ChatTemplateFactory ModelRegistry::get_default_chat_template_factory(
    const std::string& name) {
  // Use find() rather than operator[] so that querying an unknown model does
  // not insert an empty entry into the registry.
  // NOTE(review): assumes model_registry_ is a std::map/std::unordered_map
  // keyed by model name - confirm against model_registry.h.
  const auto& registry = get_instance()->model_registry_;
  const auto it = registry.find(name);
  if (it == registry.end()) {
    return nullptr;
  }
  return it->second.chat_template_factory;
}
} // namespace llm