@@ -80,6 +80,7 @@ static const std::map<llm_arch, const char *> LLM_ARCH_NAMES = {
8080 { LLM_ARCH_ARCEE, " arcee" },
8181 { LLM_ARCH_ERNIE4_5, " ernie4_5" },
8282 { LLM_ARCH_HUNYUAN_MOE, " hunyuan-moe" },
83+ { LLM_ARCH_SMOLLM3, " smollm3" },
8384 { LLM_ARCH_UNKNOWN, " (unknown)" },
8485};
8586
@@ -1749,6 +1750,23 @@ static const std::map<llm_arch, std::map<llm_tensor, const char *>> LLM_TENSOR_N
17491750 { LLM_TENSOR_TOKEN_EMBD, " token_embd" },
17501751 },
17511752 },
1753+ {
1754+ LLM_ARCH_SMOLLM3,
1755+ {
1756+ { LLM_TENSOR_TOKEN_EMBD, " token_embd" },
1757+ { LLM_TENSOR_OUTPUT_NORM, " output_norm" },
1758+ { LLM_TENSOR_OUTPUT, " output" },
1759+ { LLM_TENSOR_ATTN_NORM, " blk.%d.attn_norm" },
1760+ { LLM_TENSOR_ATTN_Q, " blk.%d.attn_q" },
1761+ { LLM_TENSOR_ATTN_K, " blk.%d.attn_k" },
1762+ { LLM_TENSOR_ATTN_V, " blk.%d.attn_v" },
1763+ { LLM_TENSOR_ATTN_OUT, " blk.%d.attn_output" },
1764+ { LLM_TENSOR_FFN_NORM, " blk.%d.ffn_norm" },
1765+ { LLM_TENSOR_FFN_GATE, " blk.%d.ffn_gate" },
1766+ { LLM_TENSOR_FFN_DOWN, " blk.%d.ffn_down" },
1767+ { LLM_TENSOR_FFN_UP, " blk.%d.ffn_up" },
1768+ },
1769+ },
17521770};
17531771
17541772static const std::map<llm_tensor, llm_tensor_info> LLM_TENSOR_INFOS = {
0 commit comments