Skip to content

Commit 0528bea

Browse files
author
wangzaijun
committed
fix cpu kv kernel bug
1 parent f902b18 commit 0528bea

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

lightllm/common/basemodel/triton_kernel/kv_cache_offload.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -252,7 +252,7 @@ def offload_gpu_kv_to_cpu(
252 252   layer_num=gpu_kv_cache.shape[0],
253 253   head_dim=head_dim,
254 254   block_num=page_num,
255     - cpu_k_start_head_index=cpu_v_start_head_index,
    255 + cpu_k_start_head_index=cpu_k_start_head_index,
256 256   cpu_k_head_num=cpu_k_head_num,
257 257   gpu_k_start_head_index=gpu_k_start_head_index,
258 258   gpu_k_head_num=gpu_k_head_num,
@@ -509,7 +509,7 @@ def load_cpu_kv_to_gpu(
509 509   cpu_stride4=cpu_kv_cache.stride(4),
510 510   layer_num=gpu_kv_cache.shape[0],
511 511   head_dim=head_dim,
512     - cpu_k_start_head_index=cpu_v_start_head_index,
    512 + cpu_k_start_head_index=cpu_k_start_head_index,
513 513   cpu_k_head_num=cpu_k_head_num,
514 514   gpu_k_start_head_index=gpu_k_start_head_index,
515 515   gpu_k_head_num=gpu_k_head_num,

0 commit comments

Comments
 (0)