We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 27a440e, commit b140f03 (Copy full SHA for b140f03)
src/llama-model.cpp
@@ -5380,8 +5380,8 @@ struct llm_build_bert : public llm_graph_context {
5380
hparams.n_expert,
5381
hparams.n_expert_used,
5382
LLM_FFN_GELU,
5383
- true, false,
5384
- 0.0f,
+ /*norm_w*/ model.arch != LLM_ARCH_NOMIC_BERT_MOE,
+ false, 0.0f,
5385
LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX, il);
5386
cb(cur, "ffn_moe_out", il);
5387
} else if (model.arch == LLM_ARCH_BERT || model.arch == LLM_ARCH_NOMIC_BERT_MOE) {
0 commit comments