We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0fed24c · commit 8b91d53 · Copy full SHA for 8b91d53
src/llama-model.cpp
@@ -4440,8 +4440,8 @@ struct llm_build_llama : public llm_graph_context {
4440
4441
if (arch == LLM_ARCH_LLAMA4 && use_rope && hparams.use_kq_norm) {
4442
// Llama4TextL2Norm
4443
- Qcur = ggml_rms_norm(ctx0, Qcur, 1e-6);
4444
- Kcur = ggml_rms_norm(ctx0, Kcur, 1e-6);
+ Qcur = ggml_rms_norm(ctx0, Qcur, hparams.f_norm_rms_eps);
+ Kcur = ggml_rms_norm(ctx0, Kcur, hparams.f_norm_rms_eps);
4445
cb(Qcur, "Qcur_normed", il);
4446
cb(Kcur, "Kcur_normed", il);
4447
}
0 commit comments