Skip to content

Commit c62c354

Browse files
committed
cont : minor fix [no ci]
1 parent 3dec397 commit c62c354

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/llama-kv-cache.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -318,9 +318,9 @@ class llama_kv_cache_context : public llama_memory_context_i {
318 318

319 319
// store k_cur and v_cur in the cache based on the provided head location
320 320
// - k_cur [n_embd_head_k, n_head_k, n_tokens]
321-
// - k_idxs [n_batch]
321+
// - k_idxs [n_tokens]
322 322
// - v_cur [n_embd_head_v, n_head_v, n_tokens]
323-
// - v_idxs [n_batch] or [n_batch*n_embd_v_gqa] depending if V cache is transposed
323+
// - v_idxs [n_tokens] or [n_tokens*n_embd_v_gqa] depending if V cache is transposed
324 324
ggml_tensor * cpy_k(ggml_context * ctx, ggml_tensor * k_cur, ggml_tensor * k_idxs, int32_t il) const;
325 325
ggml_tensor * cpy_v(ggml_context * ctx, ggml_tensor * v_cur, ggml_tensor * v_idxs, int32_t il) const;
326 326

0 commit comments

Comments
 (0)