1 file changed: +2 -5 lines changed
Original file line number | Diff line number | Diff line change
@@ -340,11 +340,8 @@ class llama_kv_cache_recurrent : public llama_kv_cache {
340340 void state_write (llama_io_write_i & io, llama_seq_id seq_id = -1 ) const override ;
341341 void state_read (llama_io_read_i & io, llama_seq_id seq_id = -1 ) override ;
342342
343- // Note: The value of head isn't only used to optimize searching
344- // for a free KV slot. llama_decode_impl also uses it, so it
345- // cannot be freely changed after a slot has been allocated.
346- uint32_t head = 0 ;
347- uint32_t size = 0 ;
343+ uint32_t head = 0 ; // the location where the batch will be placed in the cache (see find_slot())
344+ uint32_t size = 0 ; // total number of cells, shared across all sequences
348345 uint32_t used = 0 ; // used cells (i.e. at least one seq_id)
349346
350347 // computed before each graph build
You can’t perform that action at this time.
0 commit comments