Skip to content

Commit d4d1522

Browse files
authored
llama : add model type detection for rwkv7 7B&14B (ggml-org#14816)
Signed-off-by: Molly Sophia <[email protected]>
1 parent d1aa0cc commit d4d1522

File tree

1 file changed

+16
-2
lines changed

1 file changed

+16
-2
lines changed

src/llama-model.cpp

Lines changed: 16 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1544,7 +1544,11 @@ void llama_model::load_hparams(llama_model_loader & ml) {
15441544
ml.get_key(LLM_KV_TOKEN_SHIFT_COUNT, hparams.token_shift_count, false);
15451545

15461546
switch (hparams.n_layer) {
1547-
case 12: type = LLM_TYPE_190M; break;
1547+
case 12:
1548+
switch (hparams.n_embd) {
1549+
case 768: type = LLM_TYPE_190M; break;
1550+
default: type = LLM_TYPE_UNKNOWN;
1551+
} break;
15481552
case 24:
15491553
switch (hparams.n_embd) {
15501554
case 1024: type = LLM_TYPE_450M; break;
@@ -1557,7 +1561,17 @@ void llama_model::load_hparams(llama_model_loader & ml) {
15571561
case 3584: type = LLM_TYPE_7B; break;
15581562
default: type = LLM_TYPE_UNKNOWN;
15591563
} break;
1560-
case 32: type = LLM_TYPE_2_9B; break; // RWKV-7-World
1564+
case 32:
1565+
switch (hparams.n_embd) {
1566+
case 2560: type = LLM_TYPE_2_9B; break;
1567+
case 4096: type = LLM_TYPE_7B; break;
1568+
default: type = LLM_TYPE_UNKNOWN;
1569+
} break;
1570+
case 61:
1571+
switch (hparams.n_embd) {
1572+
case 4096: type = LLM_TYPE_14B; break;
1573+
default: type = LLM_TYPE_UNKNOWN;
1574+
} break;
15611575
default: type = LLM_TYPE_UNKNOWN;
15621576
}
15631577
} break;

0 commit comments

Comments
 (0)