Skip to content

Commit b140f03

Browse files
committed
fix MoE norm_w
1 parent 27a440e commit b140f03

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama-model.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5380,8 +5380,8 @@ struct llm_build_bert : public llm_graph_context {
5380 5380   hparams.n_expert,
5381 5381   hparams.n_expert_used,
5382 5382   LLM_FFN_GELU,
5383      - true, false,
5384      - 0.0f,
     5383 + /*norm_w*/ model.arch != LLM_ARCH_NOMIC_BERT_MOE,
     5384 + false, 0.0f,
5385 5385   LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX, il);
5386 5386   cb(cur, "ffn_moe_out", il);
5387 5387   } else if (model.arch == LLM_ARCH_BERT || model.arch == LLM_ARCH_NOMIC_BERT_MOE) {

0 commit comments

Comments (0)