cont : minor fix [no ci]

ggerganov · ggerganov · commit c62c354f4f51 · 2025-09-08T09:49:05.000+03:00
diff --git a/src/llama-kv-cache.h b/src/llama-kv-cache.h
@@ -318,9 +318,9 @@ class llama_kv_cache_context : public llama_memory_context_i {
 
     // store k_cur and v_cur in the cache based on the provided head location
     //   - k_cur  [n_embd_head_k, n_head_k, n_tokens]
-    //   - k_idxs [n_batch]
+    //   - k_idxs [n_tokens]
     //   - v_cur  [n_embd_head_v, n_head_v, n_tokens]
-    //   - v_idxs [n_batch] or [n_batch*n_embd_v_gqa] depending if V cache is transposed
+    //   - v_idxs [n_tokens] or [n_tokens*n_embd_v_gqa], depending on whether the V cache is transposed
     ggml_tensor * cpy_k(ggml_context * ctx, ggml_tensor * k_cur, ggml_tensor * k_idxs, int32_t il) const;
     ggml_tensor * cpy_v(ggml_context * ctx, ggml_tensor * v_cur, ggml_tensor * v_idxs, int32_t il) const;