ggml-org
diff --git a/src/models/baichuan.cpp b/src/models/baichuan.cpp
Lines changed: 0 additions & 5 deletions
diff --git a/src/models/gemma.cpp b/src/models/gemma.cpp
Lines changed: 0 additions & 4 deletions
diff --git a/src/models/gemma2_iswa.cpp b/src/models/gemma2_iswa.cpp
Lines changed: 0 additions & 4 deletions
diff --git a/src/models/gemma3_iswa.cpp b/src/models/gemma3_iswa.cpp
Lines changed: 0 additions & 5 deletions
diff --git a/src/models/glm4_moe.cpp b/src/models/glm4_moe.cpp
Lines changed: 0 additions & 5 deletions
diff --git a/src/models/gptneox.cpp b/src/models/gptneox.cpp
Lines changed: 0 additions & 3 deletions
diff --git a/src/models/granite.cpp b/src/models/granite.cpp
Lines changed: 0 additions & 8 deletions
diff --git a/src/models/grok.cpp b/src/models/grok.cpp
Lines changed: 0 additions & 8 deletions
diff --git a/src/models/hunyuan_moe.cpp b/src/models/hunyuan_moe.cpp
Lines changed: 0 additions & 6 deletions
diff --git a/src/models/internlm2.cpp b/src/models/internlm2.cpp
Lines changed: 0 additions & 6 deletions
@@ -61,7 +61,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap
                 default:
                     GGML_ABORT("fatal error");
             }
-;
 
             cb(Qcur, "Qcur", il);
             cb(Kcur, "Kcur", il);
@@ -71,13 +70,11 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap
                     model.layers[il].wo, NULL,
                     Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);
         }
-;
 
         if (il == n_layer - 1 && inp_out_ids) {
             cur   = ggml_get_rows(ctx0,   cur, inp_out_ids);
             inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
         }
-;
 
         ggml_tensor * ffn_inp = ggml_add(ctx0, cur, inpSA);
         cb(ffn_inp, "ffn_inp", il);
@@ -97,7 +94,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap
                     LLM_FFN_SILU, LLM_FFN_PAR, il);
             cb(cur, "ffn_out", il);
         }
-;
 
         cur = ggml_add(ctx0, cur, ffn_inp);
 
@@ -107,7 +103,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap
         // input for next layer
         inpL = cur;
     }
-;
 
     cur = inpL;
 
 
@@ -64,12 +64,10 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para
                     model.layers[il].wo, NULL,
                     Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f, il);
         }
-;
         if (il == n_layer - 1 && inp_out_ids) {
             cur  = ggml_get_rows(ctx0,  cur, inp_out_ids);
             inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);
         }
-;
         ggml_tensor * sa_out = ggml_add(ctx0, cur, inpL);
         cb(sa_out, "sa_out", il);
 
@@ -88,7 +86,6 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para
                     LLM_FFN_GELU, LLM_FFN_PAR, il);
             cb(cur, "ffn_out", il);
         }
-;
         cur = ggml_add(ctx0, cur, sa_out);
 
         cur = build_cvec(cur, il);
@@ -97,7 +94,6 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para
         // input for next layer
         inpL = cur;
     }
-;
     cur = inpL;
 
     cur = build_norm(cur,
 
@@ -62,12 +62,10 @@ llm_build_gemma2_iswa::llm_build_gemma2_iswa(const llama_model & model, const ll
                         model.layers[il].wo, NULL,
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f, il);
             }
-;
             if (il == n_layer - 1 && inp_out_ids) {
                 cur  = ggml_get_rows(ctx0,  cur, inp_out_ids);
                 inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);
             }
-;
             cur = build_norm(cur,
                     model.layers[il].attn_post_norm, NULL,
                     LLM_NORM_RMS, il);
@@ -91,7 +89,6 @@ llm_build_gemma2_iswa::llm_build_gemma2_iswa(const llama_model & model, const ll
                         LLM_FFN_GELU, LLM_FFN_PAR, il);
                 cb(cur, "ffn_out", il);
             }
-;
             cur = build_norm(cur,
                     model.layers[il].ffn_post_norm, NULL,
                     LLM_NORM_RMS, -1);
@@ -105,7 +102,6 @@ llm_build_gemma2_iswa::llm_build_gemma2_iswa(const llama_model & model, const ll
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
 
         cur = build_norm(cur,
 
@@ -14,7 +14,6 @@ llm_build_gemma3_iswa::llm_build_gemma3_iswa(const llama_model & model, const ll
             inpL = ggml_scale(ctx0, inpL, sqrtf(n_embd));
             cb(inpL, "inp_scaled", -1);
         }
-;
         // inp_pos - contains the positions
         ggml_tensor * inp_pos = build_inp_pos();
 
@@ -74,12 +73,10 @@ llm_build_gemma3_iswa::llm_build_gemma3_iswa(const llama_model & model, const ll
                         model.layers[il].wo, NULL,
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f, il);
             }
-;
             if (il == n_layer - 1 && inp_out_ids) {
                 cur  = ggml_get_rows(ctx0,  cur, inp_out_ids);
                 inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);
             }
-;
             cur = build_norm(cur,
                     model.layers[il].attn_post_norm, NULL,
                     LLM_NORM_RMS, il);
@@ -103,7 +100,6 @@ llm_build_gemma3_iswa::llm_build_gemma3_iswa(const llama_model & model, const ll
                         LLM_FFN_GELU, LLM_FFN_PAR, il);
                 cb(cur, "ffn_out", il);
             }
-;
             cur = build_norm(cur,
                     model.layers[il].ffn_post_norm, NULL,
                     LLM_NORM_RMS, -1);
@@ -117,7 +113,6 @@ llm_build_gemma3_iswa::llm_build_gemma3_iswa(const llama_model & model, const ll
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
 
         cur = build_norm(cur,
 
@@ -61,7 +61,6 @@ llm_build_glm4_moe::llm_build_glm4_moe(const llama_model & model, const llm_grap
                     Kcur = build_norm(Kcur, model.layers[il].attn_k_norm, NULL, LLM_NORM_RMS, il);
                     cb(Kcur, "Kcur_normed", il);
                 }
-;
                 Qcur = ggml_rope_ext(
                         ctx0, Qcur, inp_pos, nullptr,
                         n_rot, rope_type, n_ctx_orig, freq_base, freq_scale,
@@ -82,12 +81,10 @@ llm_build_glm4_moe::llm_build_glm4_moe(const llama_model & model, const llm_grap
                         model.layers[il].wo, NULL,
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);
             }
-;
             if (il == n_transformer_layers - 1 && inp_out_ids) {
                 cur   = ggml_get_rows(ctx0, cur, inp_out_ids);
                 inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
             }
-;
             ggml_tensor * ffn_inp = ggml_add(ctx0, cur, inpSA);
             cb(ffn_inp, "ffn_inp", il);
 
@@ -133,7 +130,6 @@ llm_build_glm4_moe::llm_build_glm4_moe(const llama_model & model, const llm_grap
                 cur = ggml_add(ctx0, routed_out, shared_out);
                 cb(cur, "ffn_out", il);
             }
-;
             cur = ggml_add(ctx0, cur, ffn_inp);
 
             cur = build_cvec(cur, il);
@@ -142,7 +138,6 @@ llm_build_glm4_moe::llm_build_glm4_moe(const llama_model & model, const llm_grap
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
         cur = build_norm(cur, model.output_norm, NULL, LLM_NORM_RMS, -1);
 
 
@@ -59,13 +59,11 @@ llm_build_gptneox::llm_build_gptneox(const llama_model & model, const llm_graph_
                     model.layers[il].wo, model.layers[il].bo,
                     Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);
         }
-;
 
         if (il == n_layer - 1 && inp_out_ids) {
             cur  = ggml_get_rows(ctx0,  cur, inp_out_ids);
             inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);
         }
-;
 
         // ffn
         if (hparams.use_par_res) {
@@ -129,7 +127,6 @@ llm_build_gptneox::llm_build_gptneox(const llama_model & model, const llm_graph_
             inpL = cur;
         }
     }
-;
 
     cur = build_norm(inpL,
             model.output_norm,
 
@@ -22,7 +22,6 @@ llm_build_granite::llm_build_granite(
     if (hparams.rope_finetuned) {
         inp_pos = build_inp_pos();
     }
-;
     auto * inp_attn = build_attn_inp_kv();
 
     ggml_tensor * inp_out_ids = build_inp_out_ids();
@@ -45,14 +44,12 @@ llm_build_granite::llm_build_granite(
             cur   = ggml_get_rows(ctx0,   cur, inp_out_ids);
             inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
         }
-;
         // ffn
         cur = build_layer_ffn(cur, inpSA, model, il);
 
         // input for next layer
         inpL = cur;
     }
-;
     cur = inpL;
 
     cur = build_norm(cur,
@@ -88,23 +85,20 @@ ggml_tensor * llm_build_granite::build_attention_layer(
         Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
         cb(Qcur, "Qcur", il);
     }
-;
 
     ggml_tensor * Kcur = build_lora_mm(model.layers[il].wk, cur);
     cb(Kcur, "Kcur", il);
     if (model.layers[il].bk) {
         Kcur = ggml_add(ctx0, Kcur, model.layers[il].bk);
         cb(Kcur, "Kcur", il);
     }
-;
 
     ggml_tensor * Vcur = build_lora_mm(model.layers[il].wv, cur);
     cb(Vcur, "Vcur", il);
     if (model.layers[il].bv) {
         Vcur = ggml_add(ctx0, Vcur, model.layers[il].bv);
         cb(Vcur, "Vcur", il);
     }
-;
 
     Qcur = ggml_reshape_3d(ctx0, Qcur, n_embd_head, hparams.n_head(il),    n_tokens);
     Kcur = ggml_reshape_3d(ctx0, Kcur, n_embd_head, hparams.n_head_kv(il), n_tokens);
@@ -125,7 +119,6 @@ ggml_tensor * llm_build_granite::build_attention_layer(
                 ext_factor, attn_factor, beta_fast, beta_slow
                 );
     }
-;
 
     cb(Qcur, "Qcur", il);
     cb(Kcur, "Kcur", il);
@@ -204,7 +197,6 @@ ggml_tensor * llm_build_granite::build_layer_ffn(
             cur = moe_out;
         }
     }
-;
 
     // For Granite architectures - scale residual
     if (hparams.f_residual_scale) {
 
@@ -38,21 +38,18 @@ llm_build_grok::llm_build_grok(const llama_model & model, const llm_graph_params
                     Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
                     cb(Qcur, "Qcur", il);
                 }
-;
                 ggml_tensor * Kcur = build_lora_mm(model.layers[il].wk, cur);
                 cb(Kcur, "Kcur", il);
                 if (model.layers[il].bk) {
                     Kcur = ggml_add(ctx0, Kcur, model.layers[il].bk);
                     cb(Kcur, "Kcur", il);
                 }
-;
                 ggml_tensor * Vcur = build_lora_mm(model.layers[il].wv, cur);
                 cb(Vcur, "Vcur", il);
                 if (model.layers[il].bv) {
                     Vcur = ggml_add(ctx0, Vcur, model.layers[il].bv);
                     cb(Vcur, "Vcur", il);
                 }
-;
                 Qcur = ggml_reshape_3d(ctx0, Qcur, n_embd_head, n_head,    n_tokens);
                 Kcur = ggml_reshape_3d(ctx0, Kcur, n_embd_head, n_head_kv, n_tokens);
                 Vcur = ggml_reshape_3d(ctx0, Vcur, n_embd_head, n_head_kv, n_tokens);
@@ -77,12 +74,10 @@ llm_build_grok::llm_build_grok(const llama_model & model, const llm_graph_params
                         model.layers[il].wo, model.layers[il].bo,
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f, il);
             }
-;
             if (il == n_layer - 1 && inp_out_ids) {
                 cur   = ggml_get_rows(ctx0,   cur, inp_out_ids);
                 inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
             }
-;
             cur = build_norm(cur,
                     model.layers[il].attn_out_norm, NULL,
                     LLM_NORM_RMS, il);
@@ -125,7 +120,6 @@ llm_build_grok::llm_build_grok(const llama_model & model, const llm_graph_params
             } else {
                 cur = moe_out;
             }
-;
             cur = build_norm(cur,
                     model.layers[il].ffn_post_norm, NULL,
                     LLM_NORM_RMS, il);
@@ -140,7 +134,6 @@ llm_build_grok::llm_build_grok(const llama_model & model, const llm_graph_params
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
 
         cur = build_norm(cur,
@@ -161,7 +154,6 @@ llm_build_grok::llm_build_grok(const llama_model & model, const llm_graph_params
             cur = ggml_tanh(ctx0, cur);
             cur = ggml_scale(ctx0, cur, hparams.f_final_logit_softcapping);
         }
-;
         cb(cur, "result_output", -1);
         res->t_logits = cur;
 
 
@@ -42,21 +42,18 @@ llm_build_hunyuan_moe::llm_build_hunyuan_moe(const llama_model & model, const ll
                     Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
                     cb(Qcur, "Qcur", il);
                 }
-;
                 ggml_tensor * Kcur = build_lora_mm(model.layers[il].wk, cur);
                 cb(Kcur, "Kcur", il);
                 if (model.layers[il].bk) {
                     Kcur = ggml_add(ctx0, Kcur, model.layers[il].bk);
                     cb(Kcur, "Kcur", il);
                 }
-;
                 ggml_tensor * Vcur = build_lora_mm(model.layers[il].wv, cur);
                 cb(Vcur, "Vcur", il);
                 if (model.layers[il].bv) {
                     Vcur = ggml_add(ctx0, Vcur, model.layers[il].bv);
                     cb(Vcur, "Vcur", il);
                 }
-;
                 Qcur = ggml_reshape_3d(ctx0, Qcur, n_embd_head, n_head,    n_tokens);
                 Kcur = ggml_reshape_3d(ctx0, Kcur, n_embd_head, n_head_kv, n_tokens);
                 Vcur = ggml_reshape_3d(ctx0, Vcur, n_embd_head, n_head_kv, n_tokens);
@@ -92,12 +89,10 @@ llm_build_hunyuan_moe::llm_build_hunyuan_moe(const llama_model & model, const ll
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, kq_scale, il);
                 cb(cur, "attn_out", il);
             }
-;
             if (il == n_layer - 1 && inp_out_ids) {
                 cur   = ggml_get_rows(ctx0,   cur, inp_out_ids);
                 inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
             }
-;
             ggml_tensor * ffn_inp = ggml_add(ctx0, cur, inpSA);
             cb(ffn_inp, "ffn_inp", il);
 
@@ -142,7 +137,6 @@ llm_build_hunyuan_moe::llm_build_hunyuan_moe(const llama_model & model, const ll
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
 
         cur = build_norm(cur,
 
@@ -38,21 +38,18 @@ llm_build_internlm2::llm_build_internlm2(const llama_model & model, const llm_gr
                     Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);
                     cb(Qcur, "Qcur", il);
                 }
-;
                 ggml_tensor * Kcur = build_lora_mm(model.layers[il].wk, cur);
                 cb(Kcur, "Kcur", il);
                 if (model.layers[il].bk) {
                     Kcur = ggml_add(ctx0, Kcur, model.layers[il].bk);
                     cb(Kcur, "Kcur", il);
                 }
-;
                 ggml_tensor * Vcur = build_lora_mm(model.layers[il].wv, cur);
                 cb(Vcur, "Vcur", il);
                 if (model.layers[il].bv) {
                     Vcur = ggml_add(ctx0, Vcur, model.layers[il].bv);
                     cb(Vcur, "Vcur", il);
                 }
-;
                 Qcur = ggml_reshape_3d(ctx0, Qcur, n_embd_head, n_head,    n_tokens);
                 Kcur = ggml_reshape_3d(ctx0, Kcur, n_embd_head, n_head_kv, n_tokens);
                 Vcur = ggml_reshape_3d(ctx0, Vcur, n_embd_head, n_head_kv, n_tokens);
@@ -77,12 +74,10 @@ llm_build_internlm2::llm_build_internlm2(const llama_model & model, const llm_gr
                         model.layers[il].wo, model.layers[il].bo,
                         Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);
             }
-;
             if (il == n_layer - 1 && inp_out_ids) {
                 cur   = ggml_get_rows(ctx0,   cur, inp_out_ids);
                 inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);
             }
-;
             ggml_tensor * ffn_inp = ggml_add(ctx0, cur, inpSA);
             cb(ffn_inp, "ffn_inp", il);
 
@@ -108,7 +103,6 @@ llm_build_internlm2::llm_build_internlm2(const llama_model & model, const llm_gr
             // input for next layer
             inpL = cur;
         }
-;
         cur = inpL;
 
         cur = build_norm(cur,
Original file line number	Diff line number	Diff line change
`@@ -61,7 +61,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap`
`61`	`61`	`default:`
`62`	`62`	`GGML_ABORT("fatal error");`
`63`	`63`	`}`
`64`		`-;`
`65`	`64`
`66`	`65`	`cb(Qcur, "Qcur", il);`
`67`	`66`	`cb(Kcur, "Kcur", il);`
`@@ -71,13 +70,11 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap`
`71`	`70`	`model.layers[il].wo, NULL,`
`72`	`71`	`Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);`
`73`	`72`	`}`
`74`		`-;`
`75`	`73`
`76`	`74`	`if (il == n_layer - 1 && inp_out_ids) {`
`77`	`75`	`cur = ggml_get_rows(ctx0, cur, inp_out_ids);`
`78`	`76`	`inpSA = ggml_get_rows(ctx0, inpSA, inp_out_ids);`
`79`	`77`	`}`
`80`		`-;`
`81`	`78`
`82`	`79`	`ggml_tensor * ffn_inp = ggml_add(ctx0, cur, inpSA);`
`83`	`80`	`cb(ffn_inp, "ffn_inp", il);`
`@@ -97,7 +94,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap`
`97`	`94`	`LLM_FFN_SILU, LLM_FFN_PAR, il);`
`98`	`95`	`cb(cur, "ffn_out", il);`
`99`	`96`	`}`
`100`		`-;`
`101`	`97`
`102`	`98`	`cur = ggml_add(ctx0, cur, ffn_inp);`
`103`	`99`
`@@ -107,7 +103,6 @@ llm_build_baichuan::llm_build_baichuan(const llama_model & model, const llm_grap`
`107`	`103`	`// input for next layer`
`108`	`104`	`inpL = cur;`
`109`	`105`	`}`
`110`		`-;`
`111`	`106`
`112`	`107`	`cur = inpL;`
`113`	`108`
Original file line number	Diff line number	Diff line change
`@@ -64,12 +64,10 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para`
`64`	`64`	`model.layers[il].wo, NULL,`
`65`	`65`	`Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f, il);`
`66`	`66`	`}`
`67`		`-;`
`68`	`67`	`if (il == n_layer - 1 && inp_out_ids) {`
`69`	`68`	`cur = ggml_get_rows(ctx0, cur, inp_out_ids);`
`70`	`69`	`inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);`
`71`	`70`	`}`
`72`		`-;`
`73`	`71`	`ggml_tensor * sa_out = ggml_add(ctx0, cur, inpL);`
`74`	`72`	`cb(sa_out, "sa_out", il);`
`75`	`73`
`@@ -88,7 +86,6 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para`
`88`	`86`	`LLM_FFN_GELU, LLM_FFN_PAR, il);`
`89`	`87`	`cb(cur, "ffn_out", il);`
`90`	`88`	`}`
`91`		`-;`
`92`	`89`	`cur = ggml_add(ctx0, cur, sa_out);`
`93`	`90`
`94`	`91`	`cur = build_cvec(cur, il);`
`@@ -97,7 +94,6 @@ llm_build_gemma::llm_build_gemma(const llama_model & model, const llm_graph_para`
`97`	`94`	`// input for next layer`
`98`	`95`	`inpL = cur;`
`99`	`96`	`}`
`100`		`-;`
`101`	`97`	`cur = inpL;`
`102`	`98`
`103`	`99`	`cur = build_norm(cur,`
Original file line number	Diff line number	Diff line change
`@@ -59,13 +59,11 @@ llm_build_gptneox::llm_build_gptneox(const llama_model & model, const llm_graph_`
`59`	`59`	`model.layers[il].wo, model.layers[il].bo,`
`60`	`60`	`Qcur, Kcur, Vcur, nullptr, nullptr, nullptr, 1.0f/sqrtf(float(n_embd_head)), il);`
`61`	`61`	`}`
`62`		`-;`
`63`	`62`
`64`	`63`	`if (il == n_layer - 1 && inp_out_ids) {`
`65`	`64`	`cur = ggml_get_rows(ctx0, cur, inp_out_ids);`
`66`	`65`	`inpL = ggml_get_rows(ctx0, inpL, inp_out_ids);`
`67`	`66`	`}`
`68`		`-;`
`69`	`67`
`70`	`68`	`// ffn`
`71`	`69`	`if (hparams.use_par_res) {`
`@@ -129,7 +127,6 @@ llm_build_gptneox::llm_build_gptneox(const llama_model & model, const llm_graph_`
`129`	`127`	`inpL = cur;`
`130`	`128`	`}`
`131`	`129`	`}`
`132`		`-;`
`133`	`130`
`134`	`131`	`cur = build_norm(inpL,`
`135`	`132`	`model.output_norm,`