Skip to content

Commit 83fb5b8

Browse files
committed
tmp
1 parent 770184d commit 83fb5b8

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

src/llama-kv-cache.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,7 @@ bool llama_kv_cache_init(
32 32 |
33 33 |   cache.recurrent = llama_model_is_recurrent(&model);
34 34 |   cache.v_trans = !cache.recurrent && !cparams.flash_attn;
35    | - cache.can_shift = !cache.recurrent; // not supported due to MLA
   35 | + cache.can_shift = !cache.recurrent && model.arch != LLM_ARCH_DEEPSEEK2; // not supported due to MLA
36 36 |
37 37 |   LLAMA_LOG_INFO("%s: kv_size = %d, offload = %d, type_k = '%s', type_v = '%s', n_layer = %d, can_shift = %d\n",
38 38 |   __func__, kv_size, offload, ggml_type_name(type_k), ggml_type_name(type_v), n_layer, cache.can_shift);

0 commit comments

Comments
 (0)