@@ -13828,12 +13828,13 @@ struct llm_build_smollm3 : public llm_graph_context {
1382813828 LLM_NORM_RMS, il);
1382913829 cb(ffn_cur, "ffn_norm", il);
1383013830
13831- ffn_cur = build_ffn(ffn_cur,
13832- model.layers[il].ffn_up, NULL, NULL,
13833- model.layers[il].ffn_gate, NULL, NULL,
13834- model.layers[il].ffn_down, NULL, NULL,
13835- NULL,
13836- LLM_FFN_SILU, LLM_FFN_PAR, il);
13831+ ffn_cur = build_ffn(
13832+ ffn_cur,
13833+ model.layers[il].ffn_up, model.layers[il].ffn_up_b, nullptr,
13834+ model.layers[il].ffn_gate, model.layers[il].ffn_gate_b, nullptr,
13835+ model.layers[il].ffn_down, model.layers[il].ffn_down_b, nullptr,
13836+ nullptr,
13837+ LLM_FFN_SILU, LLM_FFN_PAR, il);
1383713838 cb(ffn_cur, "ffn_out", il);
1383813839
1383913840 cur = ggml_add(ctx0, cur, ffn_cur);
@@ -13848,13 +13849,14 @@ struct llm_build_smollm3 : public llm_graph_context {
1384813849 LLM_NORM_RMS, il);
1384913850 cb(cur, "ffn_norm", il);
1385013851
13851- cur = build_ffn(cur,
13852- model.layers[il].ffn_up, NULL, NULL,
13853- model.layers[il].ffn_gate, NULL, NULL,
13854- model.layers[il].ffn_down, NULL, NULL,
13855- NULL,
13856- LLM_FFN_SILU, LLM_FFN_PAR, il);
13857- cb(cur, "ffn_out", il);
13852+ cur = build_ffn(
13853+ cur,
13854+ model.layers[il].ffn_up, model.layers[il].ffn_up_b, nullptr,
13855+ model.layers[il].ffn_gate, model.layers[il].ffn_gate_b, nullptr,
13856+ model.layers[il].ffn_down, model.layers[il].ffn_down_b, nullptr,
13857+ nullptr,
13858+ LLM_FFN_SILU, LLM_FFN_PAR, il);
13859+ cb(cur, "ffn_out", il);
1385813860
1385913861 cur = ggml_add(ctx0, cur, ffn_inp);
1386013862 cb(cur, "ffn_out", il);
0 commit comments