File tree Expand file tree Collapse file tree 2 files changed +7
-4
lines changed Expand file tree Collapse file tree 2 files changed +7
-4
lines changed Original file line number Diff line number Diff line change @@ -66,6 +66,7 @@ const char * llm_type_name(llm_type type) {
6666 case LLM_TYPE_1_7B: return "1.7B";
6767 case LLM_TYPE_1_8B: return "1.8B";
6868 case LLM_TYPE_2B: return "2B";
69+ case LLM_TYPE_2_6B: return "2.6B";
6970 case LLM_TYPE_2_8B: return "2.8B";
7071 case LLM_TYPE_2_9B: return "2.9B";
7172 case LLM_TYPE_3B: return "3B";
@@ -1977,10 +1978,11 @@ void llama_model::load_hparams(llama_model_loader & ml) {
19771978 for (uint32_t il = 0; il < hparams.n_layer; ++il) {
19781979 hparams.recurrent_layer_arr[il] = hparams.n_head_kv(il) == 0;
19791980 }
1980- switch (hparams.n_embd) {
1981- case 1024: type = LLM_TYPE_350M; break;
1982- case 1536: type = LLM_TYPE_700M; break;
1983- case 2048: type = LLM_TYPE_1_2B; break;
1981+ switch (hparams.n_ff()) {
1982+ case 4608: type = LLM_TYPE_350M; break;
1983+ case 6912: type = LLM_TYPE_700M; break;
1984+ case 8192: type = LLM_TYPE_1_2B; break;
1985+ case 10752: type = LLM_TYPE_2_6B; break;
19841986 default: type = LLM_TYPE_UNKNOWN;
19851987 }
19861988 } break;
Original file line number Diff line number Diff line change @@ -58,6 +58,7 @@ enum llm_type {
5858 LLM_TYPE_1_7B,
5959 LLM_TYPE_1_8B,
6060 LLM_TYPE_2B,
61+ LLM_TYPE_2_6B,
6162 LLM_TYPE_2_8B,
6263 LLM_TYPE_2_9B,
6364 LLM_TYPE_3B,
You can’t perform that action at this time.
0 commit comments