Skip to content

Commit ef0b5c4

Browse files
committed
fix
1 parent 1647e2b commit ef0b5c4

File tree

1 file changed

+1
-2
lines changed

1 file changed

+1
-2
lines changed

src/llama.cpp

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -614,9 +614,8 @@ static struct ggml_tensor * llm_build_kqv(
614 614   ggml_flash_attn_ext_set_prec(cur, GGML_PREC_F32);
615 615
616 616   if (n_embd_head_v < n_embd_head_k) {
617     - cur = ggml_cont(ctx, ggml_view_3d(ctx, ggml_cont(ctx, cur), n_embd_head_v, n_head, n_tokens,
    617 + cur = ggml_cont(ctx, ggml_view_2d(ctx, ggml_cont(ctx, cur), n_embd_head_v*n_head, n_tokens,
618 618   ggml_element_size(cur) * n_embd_head_v_out,
619     - ggml_element_size(cur) * n_embd_head_v_out * n_head,
620 619   0));
621 620   }
622 621
0 commit comments

Comments
 (0)