Skip to content

Commit eec8dad

Browse files
committed
fix
1 parent b0778a6 commit eec8dad

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

src/llama.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -604,8 +604,10 @@ static struct ggml_tensor * llm_build_kqv(
604604
ggml_flash_attn_ext_set_prec(cur, GGML_PREC_F32);
605605

606606
if (n_embd_head_v < n_embd_head_k) {
607-
cur = ggml_cont(ctx, ggml_view_2d(ctx, ggml_cont(ctx, cur), n_embd_head_v*n_head, n_tokens,
607+
cur = ggml_cont(ctx, cur);
608+
cur = ggml_cont(ctx, ggml_view_3d(ctx, cur, n_embd_head_v, n_head, n_tokens,
608609
ggml_element_size(cur) * n_embd_head_v_out,
610+
ggml_element_size(cur) * n_embd_head_v_out * n_head,
609611
0));
610612
}
611613

0 commit comments

Comments
 (0)