We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6cf16aa, commit 4abde12 (Copy full SHA for 4abde12)
src/llama-context.cpp
@@ -70,6 +70,10 @@ llama_context::llama_context(
70
cparams.yarn_ext_factor = rope_scaling_type == LLAMA_ROPE_SCALING_TYPE_YARN ? 1.0f : 0.0f;
71
}
72
73
+ if (model.arch == LLM_ARCH_GROK && params.yarn_beta_fast == 32.0f) {
74
+ cparams.yarn_beta_fast = 8.0f;
75
+ }
76
+
77
cparams.yarn_attn_factor *= hparams.rope_attn_factor;
78
79
if (cparams.pooling_type == LLAMA_POOLING_TYPE_UNSPECIFIED) {
0 commit comments