We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 848cade, commit 892bbc6 (Copy full SHA for 892bbc6)
src/llama.cpp
@@ -605,11 +605,11 @@ static struct ggml_tensor * llm_build_kqv(
605
606
if (n_embd_head_v < n_embd_head_k) {
607
LLAMA_LOG_INFO("cur shape: [%ld, %ld, %ld]\n", cur->ne[0], cur->ne[1], cur->ne[2]);
608
- cur = ggml_reshape_3d(ctx, cur, n_head, n_embd_head_v_out, n_tokens);
+ cur = ggml_reshape_3d(ctx, cur, n_head, n_tokens, n_embd_head_v_out);
609
610
- cur = ggml_cont(ctx, ggml_view_3d(ctx, cur, n_head, n_embd_head_v, n_tokens,
+ cur = ggml_cont(ctx, ggml_view_3d(ctx, cur, n_head, n_tokens, n_embd_head_v,
611
ggml_element_size(cur) * n_head,
612
- ggml_element_size(cur) * n_embd_head_v_out * n_head,
+ ggml_element_size(cur) * n_head * n_tokens,
613
0));
614
615
}
0 commit comments