Skip to content

Commit 0518461

Browse files
authored
cont vCur
1 parent 3c4423c commit 0518461

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

src/llama-model.cpp

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10175,6 +10175,9 @@ struct llm_build_deepseek2 : public llm_graph_context {
1017510175
ggml_tensor * Vcur = kv_cmpr;
1017610176
cb(Vcur, "Vcur", il);
1017710177

10178+
Vcur = ggml_cont(ctx0, Vcur);
10179+
cb(Vcur, "Vcur_cont", il);
10180+
1017810181
// note: MLA with the absorption optimization converts into MQA (i.e. GQA with 1 group)
1017910182
cur = build_attn(inp_attn, gf,
1018010183
model.layers[il].wo, NULL,

0 commit comments

Comments
 (0)